[clang] [llvm] [X86][AVX10.2-BF16] Remove [NE]P from intrinsic and instruction name (PR #123335)
Phoebe Wang via llvm-commits
llvm-commits at lists.llvm.org
Fri Jan 17 05:27:44 PST 2025
phoebewang (https://github.com/phoebewang) created pull request #123335: https://github.com/llvm/llvm-project/pull/123335
Ref.: https://cdrdv2.intel.com/v1/dl/getContent/828965
From ef979383a507277247d36b97572f4bf558e84305 Mon Sep 17 00:00:00 2001
From: "Wang, Phoebe" <phoebe.wang at intel.com>
Date: Fri, 17 Jan 2025 21:25:19 +0800
Subject: [PATCH] [X86][AVX10.2-BF16] Remove [NE]P from intrinsic and
instruction name
Ref.: https://cdrdv2.intel.com/v1/dl/getContent/828965
---
clang/include/clang/Basic/BuiltinsX86.td | 96 +-
clang/lib/CodeGen/CGBuiltin.cpp | 30 +-
clang/lib/Headers/avx10_2_512bf16intrin.h | 210 +-
clang/lib/Headers/avx10_2bf16intrin.h | 426 ++-
clang/lib/Sema/SemaX86.cpp | 18 +-
.../CodeGen/X86/avx10_2_512bf16-builtins.c | 300 +-
clang/test/CodeGen/X86/avx10_2bf16-builtins.c | 546 +--
llvm/include/llvm/IR/IntrinsicsX86.td | 156 +-
.../lib/Target/X86/AsmParser/X86AsmParser.cpp | 8 +-
.../X86/MCTargetDesc/X86ATTInstPrinter.cpp | 18 +-
.../X86/MCTargetDesc/X86InstComments.cpp | 4 +-
.../X86/MCTargetDesc/X86InstPrinterCommon.cpp | 20 +-
.../X86/MCTargetDesc/X86IntelInstPrinter.cpp | 18 +-
llvm/lib/Target/X86/X86InstrAVX10.td | 140 +-
llvm/lib/Target/X86/X86InstrFMA3Info.cpp | 4 +-
llvm/lib/Target/X86/X86InstrUtils.td | 6 +-
llvm/lib/Target/X86/X86IntrinsicsInfo.h | 54 +-
llvm/test/CodeGen/X86/avx10.2-fma-commute.ll | 216 +-
.../test/CodeGen/X86/avx10_2_512bf16-arith.ll | 220 +-
.../CodeGen/X86/avx10_2_512bf16-intrinsics.ll | 194 +-
llvm/test/CodeGen/X86/avx10_2bf16-arith.ll | 444 +--
.../CodeGen/X86/avx10_2bf16-intrinsics.ll | 444 +--
.../MC/Disassembler/X86/avx10.2-bf16-32.txt | 2984 ++++++++---------
.../MC/Disassembler/X86/avx10.2-bf16-64.txt | 2984 ++++++++---------
llvm/test/MC/X86/avx10.2-bf16-32-att.s | 2984 ++++++++---------
llvm/test/MC/X86/avx10.2-bf16-32-intel.s | 2984 ++++++++---------
llvm/test/MC/X86/avx10.2-bf16-64-att.s | 2984 ++++++++---------
llvm/test/MC/X86/avx10.2-bf16-64-intel.s | 2984 ++++++++---------
llvm/test/TableGen/x86-fold-tables.inc | 984 +++---
29 files changed, 11225 insertions(+), 11235 deletions(-)
diff --git a/clang/include/clang/Basic/BuiltinsX86.td b/clang/include/clang/Basic/BuiltinsX86.td
index 18fc10eb85c027..32d5486f162b38 100644
--- a/clang/include/clang/Basic/BuiltinsX86.td
+++ b/clang/include/clang/Basic/BuiltinsX86.td
@@ -5304,75 +5304,75 @@ let Features = "avx10.2-256", Attributes = [NoThrow, RequiredVectorWidth<128>] i
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vaddnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vaddbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vaddnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vaddbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vaddnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vaddbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vdivnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vdivbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vdivnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vdivbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vdivnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vdivbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vmaxpbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vmaxbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vmaxpbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vmaxbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vmaxpbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vmaxbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vminpbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vminbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vminpbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vminbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vminpbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vminbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vmulnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vmulbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vmulnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vmulbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vmulnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vmulbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vsubnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
+ def vsubbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vsubnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
+ def vsubbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vsubnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
+ def vsubbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
@@ -5385,120 +5385,120 @@ let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vcmppbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Vector<32, __bf16>, _Constant int, unsigned int)">;
+ def vcmpbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Vector<32, __bf16>, _Constant int, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vcmppbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Vector<16, __bf16>, _Constant int, unsigned short)">;
+ def vcmpbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Vector<16, __bf16>, _Constant int, unsigned short)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vcmppbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Vector<8, __bf16>, _Constant int, unsigned char)">;
- def vfpclasspbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Constant int, unsigned char)">;
+ def vcmpbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Vector<8, __bf16>, _Constant int, unsigned char)">;
+ def vfpclassbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Constant int, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vfpclasspbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Constant int, unsigned short)">;
+ def vfpclassbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Constant int, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vfpclasspbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Constant int, unsigned int)">;
+ def vfpclassbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Constant int, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vscalefpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
+ def vscalefbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vscalefpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
+ def vscalefbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vscalefpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
+ def vscalefbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vrcppbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
+ def vrcpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vrcppbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
+ def vrcpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vrcppbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
+ def vrcpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vgetexppbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
+ def vgetexpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vgetexppbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
+ def vgetexpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vgetexppbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
+ def vgetexpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vrsqrtpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
+ def vrsqrtbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vrsqrtpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
+ def vrsqrtbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vrsqrtpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
+ def vrsqrtbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vreducenepbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
+ def vreducebf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vreducenepbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
+ def vreducebf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vreducenepbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
+ def vreducebf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vrndscalenepbf16_128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
+ def vrndscalebf16_128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vrndscalenepbf16_256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
+ def vrndscalebf16_256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vrndscalenepbf16_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
+ def vrndscalebf16_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vgetmantpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
+ def vgetmantbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vgetmantpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
+ def vgetmantbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vgetmantpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
+ def vgetmantbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in {
- def vsqrtnepbf16 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>)">;
+ def vsqrtbf16 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>)">;
}
let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in {
- def vsqrtnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>)">;
+ def vsqrtbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>)">;
}
let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in {
- def vsqrtnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>)">;
+ def vsqrtbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>)">;
def vfmaddnepbh512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>)">;
}
diff --git a/clang/lib/CodeGen/CGBuiltin.cpp b/clang/lib/CodeGen/CGBuiltin.cpp
index 2385f2a320b625..4160a5b8b59bfd 100644
--- a/clang/lib/CodeGen/CGBuiltin.cpp
+++ b/clang/lib/CodeGen/CGBuiltin.cpp
@@ -16661,9 +16661,9 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID,
case X86::BI__builtin_ia32_sqrtph256:
case X86::BI__builtin_ia32_sqrtph:
case X86::BI__builtin_ia32_sqrtph512:
- case X86::BI__builtin_ia32_vsqrtnepbf16256:
- case X86::BI__builtin_ia32_vsqrtnepbf16:
- case X86::BI__builtin_ia32_vsqrtnepbf16512:
+ case X86::BI__builtin_ia32_vsqrtbf16256:
+ case X86::BI__builtin_ia32_vsqrtbf16:
+ case X86::BI__builtin_ia32_vsqrtbf16512:
case X86::BI__builtin_ia32_sqrtps512:
case X86::BI__builtin_ia32_sqrtpd512: {
if (Ops.size() == 2) {
@@ -16883,9 +16883,9 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID,
case X86::BI__builtin_ia32_fpclassps128_mask:
case X86::BI__builtin_ia32_fpclassps256_mask:
case X86::BI__builtin_ia32_fpclassps512_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16128_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16256_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16512_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16128_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16256_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16512_mask:
case X86::BI__builtin_ia32_fpclassph128_mask:
case X86::BI__builtin_ia32_fpclassph256_mask:
case X86::BI__builtin_ia32_fpclassph512_mask:
@@ -16900,14 +16900,14 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID,
Intrinsic::ID ID;
switch (BuiltinID) {
default: llvm_unreachable("Unsupported intrinsic!");
- case X86::BI__builtin_ia32_vfpclasspbf16128_mask:
- ID = Intrinsic::x86_avx10_fpclass_nepbf16_128;
+ case X86::BI__builtin_ia32_vfpclassbf16128_mask:
+ ID = Intrinsic::x86_avx10_fpclass_bf16_128;
break;
- case X86::BI__builtin_ia32_vfpclasspbf16256_mask:
- ID = Intrinsic::x86_avx10_fpclass_nepbf16_256;
+ case X86::BI__builtin_ia32_vfpclassbf16256_mask:
+ ID = Intrinsic::x86_avx10_fpclass_bf16_256;
break;
- case X86::BI__builtin_ia32_vfpclasspbf16512_mask:
- ID = Intrinsic::x86_avx10_fpclass_nepbf16_512;
+ case X86::BI__builtin_ia32_vfpclassbf16512_mask:
+ ID = Intrinsic::x86_avx10_fpclass_bf16_512;
break;
case X86::BI__builtin_ia32_fpclassph128_mask:
ID = Intrinsic::x86_avx512fp16_fpclass_ph_128;
@@ -17067,9 +17067,9 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID,
case X86::BI__builtin_ia32_vcmppd256_round_mask:
case X86::BI__builtin_ia32_vcmpps256_round_mask:
case X86::BI__builtin_ia32_vcmpph256_round_mask:
- case X86::BI__builtin_ia32_vcmppbf16512_mask:
- case X86::BI__builtin_ia32_vcmppbf16256_mask:
- case X86::BI__builtin_ia32_vcmppbf16128_mask:
+ case X86::BI__builtin_ia32_vcmpbf16512_mask:
+ case X86::BI__builtin_ia32_vcmpbf16256_mask:
+ case X86::BI__builtin_ia32_vcmpbf16128_mask:
IsMaskFCmp = true;
[[fallthrough]];
case X86::BI__builtin_ia32_cmpps:
diff --git a/clang/lib/Headers/avx10_2_512bf16intrin.h b/clang/lib/Headers/avx10_2_512bf16intrin.h
index 392b7ae770c5b5..ce43ecbcfe047c 100644
--- a/clang/lib/Headers/avx10_2_512bf16intrin.h
+++ b/clang/lib/Headers/avx10_2_512bf16intrin.h
@@ -62,17 +62,17 @@ static __inline __m512bh __DEFAULT_FN_ATTRS512 _mm512_set_pbh(
(bf3), (bf2), (bf1))
static __inline__ __m512 __DEFAULT_FN_ATTRS512
-_mm512_castpbf16_ps(__m512bh __a) {
+_mm512_castbf16_ps(__m512bh __a) {
return (__m512)__a;
}
static __inline__ __m512d __DEFAULT_FN_ATTRS512
-_mm512_castpbf16_pd(__m512bh __a) {
+_mm512_castbf16_pd(__m512bh __a) {
return (__m512d)__a;
}
static __inline__ __m512i __DEFAULT_FN_ATTRS512
-_mm512_castpbf16_si512(__m512bh __a) {
+_mm512_castbf16_si512(__m512bh __a) {
return (__m512i)__a;
}
@@ -91,39 +91,39 @@ _mm512_castsi512_pbh(__m512i __a) {
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS512
-_mm512_castpbf16512_pbh128(__m512bh __a) {
+_mm512_castbf16512_pbh128(__m512bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS512
-_mm512_castpbf16512_pbh256(__m512bh __a) {
+_mm512_castbf16512_pbh256(__m512bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11,
12, 13, 14, 15);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_castpbf16128_pbh512(__m128bh __a) {
+_mm512_castbf16128_pbh512(__m128bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_castpbf16256_pbh512(__m256bh __a) {
+_mm512_castbf16256_pbh512(__m256bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11,
12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_zextpbf16128_pbh512(__m128bh __a) {
+_mm512_zextbf16128_pbh512(__m128bh __a) {
return __builtin_shufflevector(
__a, (__v8bf)_mm_setzero_pbh(), 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12,
13, 14, 15, 8, 9, 10, 11, 12, 13, 14, 15, 8, 9, 10, 11, 12, 13, 14, 15);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_zextpbf16256_pbh512(__m256bh __a) {
+_mm512_zextbf16256_pbh512(__m256bh __a) {
return __builtin_shufflevector(__a, (__v16bf)_mm256_setzero_pbh(), 0, 1, 2, 3,
4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28,
@@ -178,81 +178,81 @@ _mm512_permutexvar_pbh(__m512i __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_permvarhi512((__v32hi)__B, (__v32hi)__A);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_addne_pbh(__m512bh __A, __m512bh __B) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_add_pbh(__m512bh __A,
+ __m512bh __B) {
return (__m512bh)((__v32bf)__A + (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_mask_addne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_mask_add_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_addne_pbh(__A, __B), (__v32bf)__W);
+ (__mmask32)__U, (__v32bf)_mm512_add_pbh(__A, __B), (__v32bf)__W);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_maskz_addne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_maskz_add_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_addne_pbh(__A, __B),
+ (__mmask32)__U, (__v32bf)_mm512_add_pbh(__A, __B),
(__v32bf)_mm512_setzero_pbh());
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_subne_pbh(__m512bh __A, __m512bh __B) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_sub_pbh(__m512bh __A,
+ __m512bh __B) {
return (__m512bh)((__v32bf)__A - (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_mask_subne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_mask_sub_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_subne_pbh(__A, __B), (__v32bf)__W);
+ (__mmask32)__U, (__v32bf)_mm512_sub_pbh(__A, __B), (__v32bf)__W);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_maskz_subne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_maskz_sub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_subne_pbh(__A, __B),
+ (__mmask32)__U, (__v32bf)_mm512_sub_pbh(__A, __B),
(__v32bf)_mm512_setzero_pbh());
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_mulne_pbh(__m512bh __A, __m512bh __B) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mul_pbh(__m512bh __A,
+ __m512bh __B) {
return (__m512bh)((__v32bf)__A * (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_mask_mulne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_mask_mul_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_mulne_pbh(__A, __B), (__v32bf)__W);
+ (__mmask32)__U, (__v32bf)_mm512_mul_pbh(__A, __B), (__v32bf)__W);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_maskz_mulne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_maskz_mul_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_mulne_pbh(__A, __B),
+ (__mmask32)__U, (__v32bf)_mm512_mul_pbh(__A, __B),
(__v32bf)_mm512_setzero_pbh());
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_divne_pbh(__m512bh __A, __m512bh __B) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_div_pbh(__m512bh __A,
+ __m512bh __B) {
return (__m512bh)((__v32bf)__A / (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_mask_divne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_mask_div_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_divne_pbh(__A, __B), (__v32bf)__W);
+ (__mmask32)__U, (__v32bf)_mm512_div_pbh(__A, __B), (__v32bf)__W);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_maskz_divne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+_mm512_maskz_div_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
return (__m512bh)__builtin_ia32_selectpbf_512(
- (__mmask32)__U, (__v32bf)_mm512_divne_pbh(__A, __B),
+ (__mmask32)__U, (__v32bf)_mm512_div_pbh(__A, __B),
(__v32bf)_mm512_setzero_pbh());
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_max_pbh(__m512bh __A,
__m512bh __B) {
- return (__m512bh)__builtin_ia32_vmaxpbf16512((__v32bf)__A, (__v32bf)__B);
+ return (__m512bh)__builtin_ia32_vmaxbf16512((__v32bf)__A, (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
@@ -270,7 +270,7 @@ _mm512_maskz_max_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_min_pbh(__m512bh __A,
__m512bh __B) {
- return (__m512bh)__builtin_ia32_vminpbf16512((__v32bf)__A, (__v32bf)__B);
+ return (__m512bh)__builtin_ia32_vminbf16512((__v32bf)__A, (__v32bf)__B);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
@@ -287,143 +287,143 @@ _mm512_maskz_min_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
}
#define _mm512_cmp_pbh_mask(__A, __B, __P) \
- ((__mmask32)__builtin_ia32_vcmppbf16512_mask((__v32bf)(__m512bh)(__A), \
- (__v32bf)(__m512bh)(__B), \
- (int)(__P), (__mmask32) - 1))
+ ((__mmask32)__builtin_ia32_vcmpbf16512_mask((__v32bf)(__m512bh)(__A), \
+ (__v32bf)(__m512bh)(__B), \
+ (int)(__P), (__mmask32) - 1))
#define _mm512_mask_cmp_pbh_mask(__U, __A, __B, __P) \
- ((__mmask32)__builtin_ia32_vcmppbf16512_mask((__v32bf)(__m512bh)(__A), \
- (__v32bf)(__m512bh)(__B), \
- (int)(__P), (__mmask32)(__U)))
+ ((__mmask32)__builtin_ia32_vcmpbf16512_mask((__v32bf)(__m512bh)(__A), \
+ (__v32bf)(__m512bh)(__B), \
+ (int)(__P), (__mmask32)(__U)))
#define _mm512_mask_fpclass_pbh_mask(__U, __A, imm) \
- ((__mmask32)__builtin_ia32_vfpclasspbf16512_mask( \
+ ((__mmask32)__builtin_ia32_vfpclassbf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__mmask32)(__U)))
#define _mm512_fpclass_pbh_mask(__A, imm) \
- ((__mmask32)__builtin_ia32_vfpclasspbf16512_mask( \
+ ((__mmask32)__builtin_ia32_vfpclassbf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__mmask32) - 1))
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_scalef_pbh(__m512bh __A, __m512bh __B) {
- return (__m512bh)__builtin_ia32_vscalefpbf16512_mask(
+ return (__m512bh)__builtin_ia32_vscalefbf16512_mask(
(__v32bf)__A, (__v32bf)__B, (__v32bf)_mm512_undefined_pbh(),
(__mmask32)-1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_scalef_pbh(
__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
- return (__m512bh)__builtin_ia32_vscalefpbf16512_mask(
+ return (__m512bh)__builtin_ia32_vscalefbf16512_mask(
(__v32bf)__A, (__v32bf)__B, (__v32bf)__W, (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_maskz_scalef_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
- return (__m512bh)__builtin_ia32_vscalefpbf16512_mask(
+ return (__m512bh)__builtin_ia32_vscalefbf16512_mask(
(__v32bf)__A, (__v32bf)__B, (__v32bf)_mm512_setzero_pbh(),
(__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_rcp_pbh(__m512bh __A) {
- return (__m512bh)__builtin_ia32_vrcppbf16512_mask(
+ return (__m512bh)__builtin_ia32_vrcpbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_mask_rcp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vrcppbf16512_mask((__v32bf)__A, (__v32bf)__W,
- (__mmask32)__U);
+ return (__m512bh)__builtin_ia32_vrcpbf16512_mask((__v32bf)__A, (__v32bf)__W,
+ (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_maskz_rcp_pbh(__mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vrcppbf16512_mask(
+ return (__m512bh)__builtin_ia32_vrcpbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_getexp_pbh(__m512bh __A) {
- return (__m512bh)__builtin_ia32_vgetexppbf16512_mask(
+ return (__m512bh)__builtin_ia32_vgetexpbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_mask_getexp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vgetexppbf16512_mask(
+ return (__m512bh)__builtin_ia32_vgetexpbf16512_mask(
(__v32bf)__A, (__v32bf)__W, (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_maskz_getexp_pbh(__mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vgetexppbf16512_mask(
+ return (__m512bh)__builtin_ia32_vgetexpbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_rsqrt_pbh(__m512bh __A) {
- return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask(
+ return (__m512bh)__builtin_ia32_vrsqrtbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_mask_rsqrt_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask(
- (__v32bf)__A, (__v32bf)__W, (__mmask32)__U);
+ return (__m512bh)__builtin_ia32_vrsqrtbf16512_mask((__v32bf)__A, (__v32bf)__W,
+ (__mmask32)__U);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
_mm512_maskz_rsqrt_pbh(__mmask32 __U, __m512bh __A) {
- return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask(
+ return (__m512bh)__builtin_ia32_vrsqrtbf16512_mask(
(__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U);
}
-#define _mm512_reducene_pbh(__A, imm) \
- ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \
+#define _mm512_reduce_pbh(__A, imm) \
+ ((__m512bh)__builtin_ia32_vreducebf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_undefined_pbh(), \
(__mmask32) - 1))
-#define _mm512_mask_reducene_pbh(__W, __U, __A, imm) \
- ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \
+#define _mm512_mask_reduce_pbh(__W, __U, __A, imm) \
+ ((__m512bh)__builtin_ia32_vreducebf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)(__m512bh)(__W), \
(__mmask32)(__U)))
-#define _mm512_maskz_reducene_pbh(__U, __A, imm) \
- ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \
+#define _mm512_maskz_reduce_pbh(__U, __A, imm) \
+ ((__m512bh)__builtin_ia32_vreducebf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \
(__mmask32)(__U)))
-#define _mm512_roundscalene_pbh(__A, imm) \
- ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \
+#define _mm512_roundscale_pbh(__A, imm) \
+ ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \
(__mmask32) - 1))
-#define _mm512_mask_roundscalene_pbh(__W, __U, __A, imm) \
- ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \
+#define _mm512_mask_roundscale_pbh(__W, __U, __A, imm) \
+ ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)(__m512bh)(__W), \
(__mmask32)(__U)))
-#define _mm512_maskz_roundscalene_pbh(__U, __A, imm) \
- ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \
+#define _mm512_maskz_roundscale_pbh(__U, __A, imm) \
+ ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \
(__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \
(__mmask32)(__U)))
#define _mm512_getmant_pbh(__A, __B, __C) \
- ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \
+ ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v32bf)_mm512_undefined_pbh(), (__mmask32) - 1))
#define _mm512_mask_getmant_pbh(__W, __U, __A, __B, __C) \
- ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \
+ ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v32bf)(__m512bh)(__W), (__mmask32)(__U)))
#define _mm512_maskz_getmant_pbh(__U, __A, __B, __C) \
- ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \
+ ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \
(__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v32bf)_mm512_setzero_pbh(), (__mmask32)(__U)))
static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_sqrt_pbh(__m512bh __A) {
- return (__m512bh)__builtin_ia32_vsqrtnepbf16512((__v32bf)__A);
+ return (__m512bh)__builtin_ia32_vsqrtbf16512((__v32bf)__A);
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
@@ -440,122 +440,118 @@ _mm512_maskz_sqrt_pbh(__mmask32 __U, __m512bh __A) {
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+_mm512_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, (__v32bf)__B,
(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fmaddne_pbh(
- __m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512
+_mm512_mask_fmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
- (__v32bf)__A);
+ _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmaddne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmadd_pbh(
__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
- (__v32bf)__C);
+ _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmaddne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmadd_pbh(
__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)_mm512_setzero_pbh());
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+_mm512_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, (__v32bf)__B,
-(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fmsubne_pbh(
- __m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512
+_mm512_mask_fmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
- (__v32bf)__A);
+ _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmsubne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmsub_pbh(
__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
- (__v32bf)__C);
+ _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmsubne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmsub_pbh(
__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)_mm512_setzero_pbh());
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+_mm512_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, -(__v32bf)__B,
(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmaddne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmadd_pbh(
__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)__A);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmaddne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmadd_pbh(
__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmaddne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmadd_pbh(
__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)_mm512_setzero_pbh());
}
static __inline__ __m512bh __DEFAULT_FN_ATTRS512
-_mm512_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+_mm512_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, -(__v32bf)__B,
-(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmsubne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmsub_pbh(
__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)__A);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmsubne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmsub_pbh(
__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)__C);
}
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmsubne_pbh(
+static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmsub_pbh(
__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
return (__m512bh)__builtin_ia32_selectpbf_512(
(__mmask32)__U,
- _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
+ _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C),
(__v32bf)_mm512_setzero_pbh());
}
diff --git a/clang/lib/Headers/avx10_2bf16intrin.h b/clang/lib/Headers/avx10_2bf16intrin.h
index 0a427b9b7418b9..0f35f6e013707d 100644
--- a/clang/lib/Headers/avx10_2bf16intrin.h
+++ b/clang/lib/Headers/avx10_2bf16intrin.h
@@ -35,31 +35,31 @@ static __inline __m128bh __DEFAULT_FN_ATTRS128 _mm_setzero_pbh(void) {
return __builtin_bit_cast(__m128bh, _mm_setzero_ps());
}
-static __inline__ __m128 __DEFAULT_FN_ATTRS128 _mm_castpbf16_ps(__m128bh __a) {
+static __inline__ __m128 __DEFAULT_FN_ATTRS128 _mm_castbf16_ps(__m128bh __a) {
return (__m128)__a;
}
static __inline__ __m256 __DEFAULT_FN_ATTRS256
-_mm256_castpbf16_ps(__m256bh __a) {
+_mm256_castbf16_ps(__m256bh __a) {
return (__m256)__a;
}
static __inline__ __m256d __DEFAULT_FN_ATTRS256
-_mm256_castpbf16_pd(__m256bh __a) {
+_mm256_castbf16_pd(__m256bh __a) {
return (__m256d)__a;
}
-static __inline__ __m128d __DEFAULT_FN_ATTRS128 _mm_castpbf16_pd(__m128bh __a) {
+static __inline__ __m128d __DEFAULT_FN_ATTRS128 _mm_castbf16_pd(__m128bh __a) {
return (__m128d)__a;
}
static __inline__ __m128i __DEFAULT_FN_ATTRS128
-_mm_castpbf16_si128(__m128bh __a) {
+_mm_castbf16_si128(__m128bh __a) {
return (__m128i)__a;
}
static __inline__ __m256i __DEFAULT_FN_ATTRS256
-_mm256_castpbf16_si256(__m256bh __a) {
+_mm256_castbf16_si256(__m256bh __a) {
return (__m256i)__a;
}
@@ -100,18 +100,18 @@ _mm256_castsi256_pbh(__m256i __a) {
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS256
-_mm256_castpbf16256_pbh128(__m256bh __a) {
+_mm256_castbf16256_pbh128(__m256bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_castpbf16128_pbh256(__m128bh __a) {
+_mm256_castbf16128_pbh256(__m128bh __a) {
return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, -1, -1, -1,
-1, -1, -1, -1, -1);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_zextpbf16128_pbh256(__m128bh __a) {
+_mm256_zextbf16128_pbh256(__m128bh __a) {
return __builtin_shufflevector(__a, (__v8bf)_mm_setzero_pbh(), 0, 1, 2, 3, 4,
5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
}
@@ -309,153 +309,149 @@ _mm256_permutexvar_pbh(__m256i __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_permvarhi256((__v16hi)__B, (__v16hi)__A);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_addne_pbh(__m256bh __A, __m256bh __B) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_add_pbh(__m256bh __A,
+ __m256bh __B) {
return (__m256bh)((__v16bf)__A + (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_mask_addne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_mask_add_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_addne_pbh(__A, __B), (__v16bf)__W);
+ (__mmask16)__U, (__v16bf)_mm256_add_pbh(__A, __B), (__v16bf)__W);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_maskz_addne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_maskz_add_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_addne_pbh(__A, __B),
+ (__mmask16)__U, (__v16bf)_mm256_add_pbh(__A, __B),
(__v16bf)_mm256_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_addne_pbh(__m128bh __A,
- __m128bh __B) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_add_pbh(__m128bh __A,
+ __m128bh __B) {
return (__m128bh)((__v8bf)__A + (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_addne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
+_mm_mask_add_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, (__v8bf)_mm_addne_pbh(__A, __B), (__v8bf)__W);
+ (__mmask8)__U, (__v8bf)_mm_add_pbh(__A, __B), (__v8bf)__W);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_addne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U,
- (__v8bf)_mm_addne_pbh(__A, __B),
- (__v8bf)_mm_setzero_pbh());
+_mm_maskz_add_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
+ return (__m128bh)__builtin_ia32_selectpbf_128(
+ (__mmask8)__U, (__v8bf)_mm_add_pbh(__A, __B), (__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_subne_pbh(__m256bh __A, __m256bh __B) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_sub_pbh(__m256bh __A,
+ __m256bh __B) {
return (__m256bh)((__v16bf)__A - (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_mask_subne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_mask_sub_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_subne_pbh(__A, __B), (__v16bf)__W);
+ (__mmask16)__U, (__v16bf)_mm256_sub_pbh(__A, __B), (__v16bf)__W);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_maskz_subne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_maskz_sub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_subne_pbh(__A, __B),
+ (__mmask16)__U, (__v16bf)_mm256_sub_pbh(__A, __B),
(__v16bf)_mm256_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_subne_pbh(__m128bh __A,
- __m128bh __B) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_sub_pbh(__m128bh __A,
+ __m128bh __B) {
return (__m128bh)((__v8bf)__A - (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_subne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
+_mm_mask_sub_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, (__v8bf)_mm_subne_pbh(__A, __B), (__v8bf)__W);
+ (__mmask8)__U, (__v8bf)_mm_sub_pbh(__A, __B), (__v8bf)__W);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_subne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U,
- (__v8bf)_mm_subne_pbh(__A, __B),
- (__v8bf)_mm_setzero_pbh());
+_mm_maskz_sub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
+ return (__m128bh)__builtin_ia32_selectpbf_128(
+ (__mmask8)__U, (__v8bf)_mm_sub_pbh(__A, __B), (__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_mulne_pbh(__m256bh __A, __m256bh __B) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mul_pbh(__m256bh __A,
+ __m256bh __B) {
return (__m256bh)((__v16bf)__A * (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_mask_mulne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_mask_mul_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_mulne_pbh(__A, __B), (__v16bf)__W);
+ (__mmask16)__U, (__v16bf)_mm256_mul_pbh(__A, __B), (__v16bf)__W);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_maskz_mulne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_maskz_mul_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_mulne_pbh(__A, __B),
+ (__mmask16)__U, (__v16bf)_mm256_mul_pbh(__A, __B),
(__v16bf)_mm256_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mulne_pbh(__m128bh __A,
- __m128bh __B) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mul_pbh(__m128bh __A,
+ __m128bh __B) {
return (__m128bh)((__v8bf)__A * (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_mulne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
+_mm_mask_mul_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, (__v8bf)_mm_mulne_pbh(__A, __B), (__v8bf)__W);
+ (__mmask8)__U, (__v8bf)_mm_mul_pbh(__A, __B), (__v8bf)__W);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_mulne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U,
- (__v8bf)_mm_mulne_pbh(__A, __B),
- (__v8bf)_mm_setzero_pbh());
+_mm_maskz_mul_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
+ return (__m128bh)__builtin_ia32_selectpbf_128(
+ (__mmask8)__U, (__v8bf)_mm_mul_pbh(__A, __B), (__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_divne_pbh(__m256bh __A, __m256bh __B) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_div_pbh(__m256bh __A,
+ __m256bh __B) {
return (__m256bh)((__v16bf)__A / (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_mask_divne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_mask_div_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_divne_pbh(__A, __B), (__v16bf)__W);
+ (__mmask16)__U, (__v16bf)_mm256_div_pbh(__A, __B), (__v16bf)__W);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_maskz_divne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+_mm256_maskz_div_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
return (__m256bh)__builtin_ia32_selectpbf_256(
- (__mmask16)__U, (__v16bf)_mm256_divne_pbh(__A, __B),
+ (__mmask16)__U, (__v16bf)_mm256_div_pbh(__A, __B),
(__v16bf)_mm256_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_divne_pbh(__m128bh __A,
- __m128bh __B) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_div_pbh(__m128bh __A,
+ __m128bh __B) {
return (__m128bh)((__v8bf)__A / (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_divne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
+_mm_mask_div_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, (__v8bf)_mm_divne_pbh(__A, __B), (__v8bf)__W);
+ (__mmask8)__U, (__v8bf)_mm_div_pbh(__A, __B), (__v8bf)__W);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_divne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U,
- (__v8bf)_mm_divne_pbh(__A, __B),
- (__v8bf)_mm_setzero_pbh());
+_mm_maskz_div_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
+ return (__m128bh)__builtin_ia32_selectpbf_128(
+ (__mmask8)__U, (__v8bf)_mm_div_pbh(__A, __B), (__v8bf)_mm_setzero_pbh());
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_max_pbh(__m256bh __A,
__m256bh __B) {
- return (__m256bh)__builtin_ia32_vmaxpbf16256((__v16bf)__A, (__v16bf)__B);
+ return (__m256bh)__builtin_ia32_vmaxbf16256((__v16bf)__A, (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
@@ -473,7 +469,7 @@ _mm256_maskz_max_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_max_pbh(__m128bh __A,
__m128bh __B) {
- return (__m128bh)__builtin_ia32_vmaxpbf16128((__v8bf)__A, (__v8bf)__B);
+ return (__m128bh)__builtin_ia32_vmaxbf16128((__v8bf)__A, (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
@@ -490,7 +486,7 @@ _mm_maskz_max_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_min_pbh(__m256bh __A,
__m256bh __B) {
- return (__m256bh)__builtin_ia32_vminpbf16256((__v16bf)__A, (__v16bf)__B);
+ return (__m256bh)__builtin_ia32_vminbf16256((__v16bf)__A, (__v16bf)__B);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
@@ -508,7 +504,7 @@ _mm256_maskz_min_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_min_pbh(__m128bh __A,
__m128bh __B) {
- return (__m128bh)__builtin_ia32_vminpbf16128((__v8bf)__A, (__v8bf)__B);
+ return (__m128bh)__builtin_ia32_vminbf16128((__v8bf)__A, (__v8bf)__B);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
@@ -554,275 +550,275 @@ static __inline__ int __DEFAULT_FN_ATTRS128 _mm_comneqsbh(__m128bh A,
}
#define _mm256_cmp_pbh_mask(__A, __B, __P) \
- ((__mmask16)__builtin_ia32_vcmppbf16256_mask((__v16bf)(__m256bh)(__A), \
- (__v16bf)(__m256bh)(__B), \
- (int)(__P), (__mmask16) - 1))
+ ((__mmask16)__builtin_ia32_vcmpbf16256_mask((__v16bf)(__m256bh)(__A), \
+ (__v16bf)(__m256bh)(__B), \
+ (int)(__P), (__mmask16) - 1))
#define _mm256_mask_cmp_pbh_mask(__U, __A, __B, __P) \
- ((__mmask16)__builtin_ia32_vcmppbf16256_mask((__v16bf)(__m256bh)(__A), \
- (__v16bf)(__m256bh)(__B), \
- (int)(__P), (__mmask16)(__U)))
+ ((__mmask16)__builtin_ia32_vcmpbf16256_mask((__v16bf)(__m256bh)(__A), \
+ (__v16bf)(__m256bh)(__B), \
+ (int)(__P), (__mmask16)(__U)))
#define _mm_cmp_pbh_mask(__A, __B, __P) \
- ((__mmask8)__builtin_ia32_vcmppbf16128_mask((__v8bf)(__m128bh)(__A), \
- (__v8bf)(__m128bh)(__B), \
- (int)(__P), (__mmask8) - 1))
+ ((__mmask8)__builtin_ia32_vcmpbf16128_mask((__v8bf)(__m128bh)(__A), \
+ (__v8bf)(__m128bh)(__B), \
+ (int)(__P), (__mmask8) - 1))
#define _mm_mask_cmp_pbh_mask(__U, __A, __B, __P) \
- ((__mmask8)__builtin_ia32_vcmppbf16128_mask((__v8bf)(__m128bh)(__A), \
- (__v8bf)(__m128bh)(__B), \
- (int)(__P), (__mmask8)(__U)))
+ ((__mmask8)__builtin_ia32_vcmpbf16128_mask((__v8bf)(__m128bh)(__A), \
+ (__v8bf)(__m128bh)(__B), \
+ (int)(__P), (__mmask8)(__U)))
#define _mm256_mask_fpclass_pbh_mask(__U, __A, imm) \
- ((__mmask16)__builtin_ia32_vfpclasspbf16256_mask( \
+ ((__mmask16)__builtin_ia32_vfpclassbf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__mmask16)(__U)))
#define _mm256_fpclass_pbh_mask(__A, imm) \
- ((__mmask16)__builtin_ia32_vfpclasspbf16256_mask( \
+ ((__mmask16)__builtin_ia32_vfpclassbf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__mmask16) - 1))
#define _mm_mask_fpclass_pbh_mask(__U, __A, imm) \
- ((__mmask8)__builtin_ia32_vfpclasspbf16128_mask( \
- (__v8bf)(__m128bh)(__A), (int)(imm), (__mmask8)(__U)))
+ ((__mmask8)__builtin_ia32_vfpclassbf16128_mask((__v8bf)(__m128bh)(__A), \
+ (int)(imm), (__mmask8)(__U)))
#define _mm_fpclass_pbh_mask(__A, imm) \
- ((__mmask8)__builtin_ia32_vfpclasspbf16128_mask((__v8bf)(__m128bh)(__A), \
- (int)(imm), (__mmask8) - 1))
+ ((__mmask8)__builtin_ia32_vfpclassbf16128_mask((__v8bf)(__m128bh)(__A), \
+ (int)(imm), (__mmask8) - 1))
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_scalef_pbh(__m256bh __A, __m256bh __B) {
- return (__m256bh)__builtin_ia32_vscalefpbf16256_mask(
+ return (__m256bh)__builtin_ia32_vscalefbf16256_mask(
(__v16bf)__A, (__v16bf)__B, (__v16bf)_mm256_undefined_pbh(),
(__mmask16)-1);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_scalef_pbh(
__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
- return (__m256bh)__builtin_ia32_vscalefpbf16256_mask(
+ return (__m256bh)__builtin_ia32_vscalefbf16256_mask(
(__v16bf)__A, (__v16bf)__B, (__v16bf)__W, (__mmask16)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_maskz_scalef_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
- return (__m256bh)__builtin_ia32_vscalefpbf16256_mask(
+ return (__m256bh)__builtin_ia32_vscalefbf16256_mask(
(__v16bf)__A, (__v16bf)__B, (__v16bf)_mm256_setzero_pbh(),
(__mmask16)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_scalef_pbh(__m128bh __A,
__m128bh __B) {
- return (__m128bh)__builtin_ia32_vscalefpbf16128_mask(
+ return (__m128bh)__builtin_ia32_vscalefbf16128_mask(
(__v8bf)__A, (__v8bf)__B, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_mask_scalef_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_vscalefpbf16128_mask(
+ return (__m128bh)__builtin_ia32_vscalefbf16128_mask(
(__v8bf)__A, (__v8bf)__B, (__v8bf)__W, (__mmask8)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_maskz_scalef_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
- return (__m128bh)__builtin_ia32_vscalefpbf16128_mask(
+ return (__m128bh)__builtin_ia32_vscalefbf16128_mask(
(__v8bf)__A, (__v8bf)__B, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_rcp_pbh(__m256bh __A) {
- return (__m256bh)__builtin_ia32_vrcppbf16256_mask(
+ return (__m256bh)__builtin_ia32_vrcpbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_mask_rcp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vrcppbf16256_mask((__v16bf)__A, (__v16bf)__W,
- (__mmask16)__U);
+ return (__m256bh)__builtin_ia32_vrcpbf16256_mask((__v16bf)__A, (__v16bf)__W,
+ (__mmask16)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_maskz_rcp_pbh(__mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vrcppbf16256_mask(
+ return (__m256bh)__builtin_ia32_vrcpbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_rcp_pbh(__m128bh __A) {
- return (__m128bh)__builtin_ia32_vrcppbf16128_mask(
+ return (__m128bh)__builtin_ia32_vrcpbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_mask_rcp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vrcppbf16128_mask((__v8bf)__A, (__v8bf)__W,
- (__mmask8)__U);
+ return (__m128bh)__builtin_ia32_vrcpbf16128_mask((__v8bf)__A, (__v8bf)__W,
+ (__mmask8)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_maskz_rcp_pbh(__mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vrcppbf16128_mask(
+ return (__m128bh)__builtin_ia32_vrcpbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_getexp_pbh(__m256bh __A) {
- return (__m256bh)__builtin_ia32_vgetexppbf16256_mask(
+ return (__m256bh)__builtin_ia32_vgetexpbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_mask_getexp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vgetexppbf16256_mask(
+ return (__m256bh)__builtin_ia32_vgetexpbf16256_mask(
(__v16bf)__A, (__v16bf)__W, (__mmask16)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_maskz_getexp_pbh(__mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vgetexppbf16256_mask(
+ return (__m256bh)__builtin_ia32_vgetexpbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_getexp_pbh(__m128bh __A) {
- return (__m128bh)__builtin_ia32_vgetexppbf16128_mask(
+ return (__m128bh)__builtin_ia32_vgetexpbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_mask_getexp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vgetexppbf16128_mask((__v8bf)__A, (__v8bf)__W,
- (__mmask8)__U);
+ return (__m128bh)__builtin_ia32_vgetexpbf16128_mask((__v8bf)__A, (__v8bf)__W,
+ (__mmask8)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_maskz_getexp_pbh(__mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vgetexppbf16128_mask(
+ return (__m128bh)__builtin_ia32_vgetexpbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_rsqrt_pbh(__m256bh __A) {
- return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask(
+ return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_mask_rsqrt_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask(
- (__v16bf)__A, (__v16bf)__W, (__mmask16)__U);
+ return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask((__v16bf)__A, (__v16bf)__W,
+ (__mmask16)__U);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
_mm256_maskz_rsqrt_pbh(__mmask16 __U, __m256bh __A) {
- return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask(
+ return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask(
(__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_rsqrt_pbh(__m128bh __A) {
- return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask(
+ return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_mask_rsqrt_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask((__v8bf)__A, (__v8bf)__W,
- (__mmask8)__U);
+ return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask((__v8bf)__A, (__v8bf)__W,
+ (__mmask8)__U);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
_mm_maskz_rsqrt_pbh(__mmask8 __U, __m128bh __A) {
- return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask(
+ return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask(
(__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U);
}
-#define _mm256_reducene_pbh(__A, imm) \
- ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \
+#define _mm256_reduce_pbh(__A, imm) \
+ ((__m256bh)__builtin_ia32_vreducebf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_undefined_pbh(), \
(__mmask16) - 1))
-#define _mm256_mask_reducene_pbh(__W, __U, __A, imm) \
- ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \
+#define _mm256_mask_reduce_pbh(__W, __U, __A, imm) \
+ ((__m256bh)__builtin_ia32_vreducebf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)(__m256bh)(__W), \
(__mmask16)(__U)))
-#define _mm256_maskz_reducene_pbh(__U, __A, imm) \
- ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \
+#define _mm256_maskz_reduce_pbh(__U, __A, imm) \
+ ((__m256bh)__builtin_ia32_vreducebf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \
(__mmask16)(__U)))
-#define _mm_reducene_pbh(__A, imm) \
- ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \
+#define _mm_reduce_pbh(__A, imm) \
+ ((__m128bh)__builtin_ia32_vreducebf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_undefined_pbh(), \
(__mmask8) - 1))
-#define _mm_mask_reducene_pbh(__W, __U, __A, imm) \
- ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \
+#define _mm_mask_reduce_pbh(__W, __U, __A, imm) \
+ ((__m128bh)__builtin_ia32_vreducebf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)(__m128bh)(__W), \
(__mmask8)(__U)))
-#define _mm_maskz_reducene_pbh(__U, __A, imm) \
- ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \
+#define _mm_maskz_reduce_pbh(__U, __A, imm) \
+ ((__m128bh)__builtin_ia32_vreducebf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \
(__mmask8)(__U)))
-#define _mm256_roundscalene_pbh(__A, imm) \
- ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \
+#define _mm256_roundscale_pbh(__A, imm) \
+ ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \
(__mmask16) - 1))
-#define _mm256_mask_roundscalene_pbh(__W, __U, __A, imm) \
- ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \
+#define _mm256_mask_roundscale_pbh(__W, __U, __A, imm) \
+ ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)(__m256bh)(__W), \
(__mmask16)(__U)))
-#define _mm256_maskz_roundscalene_pbh(__U, __A, imm) \
- ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \
+#define _mm256_maskz_roundscale_pbh(__U, __A, imm) \
+ ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \
(__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \
(__mmask16)(__U)))
-#define _mm_roundscalene_pbh(__A, imm) \
- ((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \
+#define _mm_roundscale_pbh(__A, imm) \
+ ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \
(__mmask8) - 1))
-#define _mm_mask_roundscalene_pbh(__W, __U, __A, imm) \
- ((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \
+#define _mm_mask_roundscale_pbh(__W, __U, __A, imm) \
+ ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)(__m128bh)(__W), \
(__mmask8)(__U)))
-#define _mm_maskz_roundscalene_pbh(__U, __A, imm) \
- ((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \
+#define _mm_maskz_roundscale_pbh(__U, __A, imm) \
+ ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \
(__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \
(__mmask8)(__U)))
#define _mm256_getmant_pbh(__A, __B, __C) \
- ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \
+ ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v16bf)_mm256_undefined_pbh(), (__mmask16) - 1))
#define _mm256_mask_getmant_pbh(__W, __U, __A, __B, __C) \
- ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \
+ ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v16bf)(__m256bh)(__W), (__mmask16)(__U)))
#define _mm256_maskz_getmant_pbh(__U, __A, __B, __C) \
- ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \
+ ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \
(__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v16bf)_mm256_setzero_pbh(), (__mmask16)(__U)))
#define _mm_getmant_pbh(__A, __B, __C) \
- ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \
+ ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v8bf)_mm_undefined_pbh(), (__mmask8) - 1))
#define _mm_mask_getmant_pbh(__W, __U, __A, __B, __C) \
- ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \
+ ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v8bf)(__m128bh)(__W), (__mmask8)(__U)))
#define _mm_maskz_getmant_pbh(__U, __A, __B, __C) \
- ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \
+ ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \
(__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \
(__v8bf)_mm_setzero_pbh(), (__mmask8)(__U)))
static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_sqrt_pbh(__m256bh __A) {
- return (__m256bh)__builtin_ia32_vsqrtnepbf16256((__v16bf)__A);
+ return (__m256bh)__builtin_ia32_vsqrtbf16256((__v16bf)__A);
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
@@ -839,7 +835,7 @@ _mm256_maskz_sqrt_pbh(__mmask16 __U, __m256bh __A) {
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_sqrt_pbh(__m128bh __A) {
- return (__m128bh)__builtin_ia32_vsqrtnepbf16((__v8bf)__A);
+ return (__m128bh)__builtin_ia32_vsqrtbf16((__v8bf)__A);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
@@ -855,232 +851,230 @@ _mm_maskz_sqrt_pbh(__mmask8 __U, __m128bh __A) {
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+_mm256_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, (__v16bf)__B,
(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fmaddne_pbh(
- __m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256
+_mm256_mask_fmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
- (__v16bf)__A);
+ _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmaddne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmadd_pbh(
__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
- (__v16bf)__C);
+ _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmaddne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmadd_pbh(
__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)_mm256_setzero_pbh());
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+_mm256_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, (__v16bf)__B,
-(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fmsubne_pbh(
- __m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256
+_mm256_mask_fmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
- (__v16bf)__A);
+ _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmsubne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmsub_pbh(
__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
- (__v16bf)__C);
+ _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmsubne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmsub_pbh(
__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)_mm256_setzero_pbh());
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+_mm256_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, -(__v16bf)__B,
(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmaddne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmadd_pbh(
__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)__A);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmaddne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmadd_pbh(
__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmaddne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmadd_pbh(
__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)_mm256_setzero_pbh());
}
static __inline__ __m256bh __DEFAULT_FN_ATTRS256
-_mm256_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+_mm256_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, -(__v16bf)__B,
-(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmsubne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmsub_pbh(
__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)__A);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmsubne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmsub_pbh(
__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)__C);
}
-static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmsubne_pbh(
+static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmsub_pbh(
__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
return (__m256bh)__builtin_ia32_selectpbf_256(
(__mmask16)__U,
- _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
+ _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C),
(__v16bf)_mm256_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmaddne_pbh(__m128bh __A,
- __m128bh __B,
- __m128bh __C) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmadd_pbh(__m128bh __A,
+ __m128bh __B,
+ __m128bh __C) {
return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, (__v8bf)__B,
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_fmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+_mm_mask_fmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__A);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask3_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+_mm_mask3_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_fmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+_mm_maskz_fmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmsubne_pbh(__m128bh __A,
- __m128bh __B,
- __m128bh __C) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmsub_pbh(__m128bh __A,
+ __m128bh __B,
+ __m128bh __C) {
return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, (__v8bf)__B,
-(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_fmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+_mm_mask_fmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__A);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask3_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+_mm_mask3_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_fmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+_mm_maskz_fmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fnmadd_pbh(__m128bh __A,
+ __m128bh __B,
+ __m128bh __C) {
return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, -(__v8bf)__B,
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_fnmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+_mm_mask_fnmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__A);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask3_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+_mm_mask3_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_fnmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+_mm_maskz_fnmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)_mm_setzero_pbh());
}
-static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fnmsub_pbh(__m128bh __A,
+ __m128bh __B,
+ __m128bh __C) {
return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, -(__v8bf)__B,
-(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask_fnmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+_mm_mask_fnmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__A);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_mask3_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+_mm_mask3_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)__C);
}
static __inline__ __m128bh __DEFAULT_FN_ATTRS128
-_mm_maskz_fnmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+_mm_maskz_fnmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
return (__m128bh)__builtin_ia32_selectpbf_128(
- (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
+ (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C),
(__v8bf)_mm_setzero_pbh());
}
diff --git a/clang/lib/Sema/SemaX86.cpp b/clang/lib/Sema/SemaX86.cpp
index 0b4b78c5b15dc5..39c8ce1534c229 100644
--- a/clang/lib/Sema/SemaX86.cpp
+++ b/clang/lib/Sema/SemaX86.cpp
@@ -931,9 +931,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID,
case X86::BI__builtin_ia32_rndscaleps_mask:
case X86::BI__builtin_ia32_rndscalepd_mask:
case X86::BI__builtin_ia32_rndscaleph_mask:
- case X86::BI__builtin_ia32_vrndscalenepbf16_128_mask:
- case X86::BI__builtin_ia32_vrndscalenepbf16_256_mask:
- case X86::BI__builtin_ia32_vrndscalenepbf16_mask:
+ case X86::BI__builtin_ia32_vrndscalebf16_128_mask:
+ case X86::BI__builtin_ia32_vrndscalebf16_256_mask:
+ case X86::BI__builtin_ia32_vrndscalebf16_mask:
case X86::BI__builtin_ia32_reducepd128_mask:
case X86::BI__builtin_ia32_reducepd256_mask:
case X86::BI__builtin_ia32_reducepd512_mask:
@@ -943,9 +943,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID,
case X86::BI__builtin_ia32_reduceph128_mask:
case X86::BI__builtin_ia32_reduceph256_mask:
case X86::BI__builtin_ia32_reduceph512_mask:
- case X86::BI__builtin_ia32_vreducenepbf16128_mask:
- case X86::BI__builtin_ia32_vreducenepbf16256_mask:
- case X86::BI__builtin_ia32_vreducenepbf16512_mask:
+ case X86::BI__builtin_ia32_vreducebf16128_mask:
+ case X86::BI__builtin_ia32_vreducebf16256_mask:
+ case X86::BI__builtin_ia32_vreducebf16512_mask:
case X86::BI__builtin_ia32_vreducepd256_round_mask:
case X86::BI__builtin_ia32_vreduceps256_round_mask:
case X86::BI__builtin_ia32_vreduceph256_round_mask:
@@ -973,9 +973,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID,
case X86::BI__builtin_ia32_fpclassph128_mask:
case X86::BI__builtin_ia32_fpclassph256_mask:
case X86::BI__builtin_ia32_fpclassph512_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16128_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16256_mask:
- case X86::BI__builtin_ia32_vfpclasspbf16512_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16128_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16256_mask:
+ case X86::BI__builtin_ia32_vfpclassbf16512_mask:
case X86::BI__builtin_ia32_fpclasssd_mask:
case X86::BI__builtin_ia32_fpclassss_mask:
case X86::BI__builtin_ia32_fpclasssh_mask:
diff --git a/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c b/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c
index b00859c174fbab..78405d63984f64 100644
--- a/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c
+++ b/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c
@@ -146,22 +146,22 @@ __m512bh test_mm512_setr_pbh(__bf16 bf1, __bf16 bf2, __bf16 bf3, __bf16 bf4,
bf25, bf26, bf27, bf28, bf29, bf30, bf31, bf32);
}
-__m512 test_mm512_castpbf16_ps(__m512bh A) {
- // CHECK-LABEL: test_mm512_castpbf16_ps
+__m512 test_mm512_castbf16_ps(__m512bh A) {
+ // CHECK-LABEL: test_mm512_castbf16_ps
// CHECK: bitcast <32 x bfloat> %{{.*}} to <16 x float>
- return _mm512_castpbf16_ps(A);
+ return _mm512_castbf16_ps(A);
}
-__m512d test_mm512_castpbf16_pd(__m512bh A) {
- // CHECK-LABEL: test_mm512_castpbf16_pd
+__m512d test_mm512_castbf16_pd(__m512bh A) {
+ // CHECK-LABEL: test_mm512_castbf16_pd
// CHECK: bitcast <32 x bfloat> %{{.*}} to <8 x double>
- return _mm512_castpbf16_pd(A);
+ return _mm512_castbf16_pd(A);
}
-__m512i test_mm512_castpbf16_si512(__m512bh A) {
- // CHECK-LABEL: test_mm512_castpbf16_si512
+__m512i test_mm512_castbf16_si512(__m512bh A) {
+ // CHECK-LABEL: test_mm512_castbf16_si512
// CHECK: bitcast <32 x bfloat> %{{.*}} to <8 x i64>
- return _mm512_castpbf16_si512(A);
+ return _mm512_castbf16_si512(A);
}
__m512bh test_mm512_castps_pbh(__m512 A) {
@@ -182,40 +182,40 @@ __m512bh test_mm512_castsi512_pbh(__m512i A) {
return _mm512_castsi512_pbh(A);
}
-__m128bh test_mm512_castpbf16512_pbh128(__m512bh __a) {
- // CHECK-LABEL: test_mm512_castpbf16512_pbh128
+__m128bh test_mm512_castbf16512_pbh128(__m512bh __a) {
+ // CHECK-LABEL: test_mm512_castbf16512_pbh128
// CHECK: shufflevector <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
- return _mm512_castpbf16512_pbh128(__a);
+ return _mm512_castbf16512_pbh128(__a);
}
-__m256bh test_mm512_castpbf16512_pbh256(__m512bh __a) {
- // CHECK-LABEL: test_mm512_castpbf16512_pbh256
+__m256bh test_mm512_castbf16512_pbh256(__m512bh __a) {
+ // CHECK-LABEL: test_mm512_castbf16512_pbh256
// CHECK: shufflevector <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
- return _mm512_castpbf16512_pbh256(__a);
+ return _mm512_castbf16512_pbh256(__a);
}
-__m512bh test_mm512_castpbf16128_pbh512(__m128bh __a) {
- // CHECK-LABEL: test_mm512_castpbf16128_pbh512
+__m512bh test_mm512_castbf16128_pbh512(__m128bh __a) {
+ // CHECK-LABEL: test_mm512_castbf16128_pbh512
// CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison>
- return _mm512_castpbf16128_pbh512(__a);
+ return _mm512_castbf16128_pbh512(__a);
}
-__m512bh test_mm512_castpbf16256_pbh512(__m256bh __a) {
- // CHECK-LABEL: test_mm512_castpbf16256_pbh512
+__m512bh test_mm512_castbf16256_pbh512(__m256bh __a) {
+ // CHECK-LABEL: test_mm512_castbf16256_pbh512
// CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison>
- return _mm512_castpbf16256_pbh512(__a);
+ return _mm512_castbf16256_pbh512(__a);
}
-__m512bh test_mm512_zextpbf16128_pbh512(__m128bh __a) {
- // CHECK-LABEL: test_mm512_zextpbf16128_pbh512
+__m512bh test_mm512_zextbf16128_pbh512(__m128bh __a) {
+ // CHECK-LABEL: test_mm512_zextbf16128_pbh512
// CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> {{.*}}, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
- return _mm512_zextpbf16128_pbh512(__a);
+ return _mm512_zextbf16128_pbh512(__a);
}
-__m512bh test_mm512_zextpbf16256_pbh512(__m256bh __a) {
- // CHECK-LABEL: test_mm512_zextpbf16256_pbh512
+__m512bh test_mm512_zextbf16256_pbh512(__m256bh __a) {
+ // CHECK-LABEL: test_mm512_zextbf16256_pbh512
// CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> {{.*}}, <32 x i32>
- return _mm512_zextpbf16256_pbh512(__a);
+ return _mm512_zextbf16256_pbh512(__a);
}
__m512bh test_mm512_abs_pbh(__m512bh a) {
@@ -277,110 +277,110 @@ __m512bh test_mm512_permutexvar_epi16(__m512i __A, __m512bh __B) {
return _mm512_permutexvar_pbh(__A, __B);
}
-__m512bh test_mm512_addne_pbh(__m512bh __A, __m512bh __B) {
- // CHECK-LABEL: @test_mm512_addne_pbh
+__m512bh test_mm512_add_pbh(__m512bh __A, __m512bh __B) {
+ // CHECK-LABEL: @test_mm512_add_pbh
// CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}}
- return _mm512_addne_pbh(__A, __B);
+ return _mm512_add_pbh(__A, __B);
}
-__m512bh test_mm512_mask_addne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_mask_add_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_addne_pbh(__W, __U, __A, __B);
+ return _mm512_mask_add_pbh(__W, __U, __A, __B);
}
-__m512bh test_mm512_maskz_addne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_maskz_add_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_addne_pbh(__U, __A, __B);
+ return _mm512_maskz_add_pbh(__U, __A, __B);
}
-__m512bh test_mm512_subne_pbh(__m512bh __A, __m512bh __B) {
- // CHECK-LABEL: @test_mm512_subne_pbh
+__m512bh test_mm512_sub_pbh(__m512bh __A, __m512bh __B) {
+ // CHECK-LABEL: @test_mm512_sub_pbh
// CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}}
- return _mm512_subne_pbh(__A, __B);
+ return _mm512_sub_pbh(__A, __B);
}
-__m512bh test_mm512_mask_subne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_mask_sub_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_subne_pbh(__W, __U, __A, __B);
+ return _mm512_mask_sub_pbh(__W, __U, __A, __B);
}
-__m512bh test_mm512_maskz_subne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_maskz_sub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_subne_pbh(__U, __A, __B);
+ return _mm512_maskz_sub_pbh(__U, __A, __B);
}
-__m512bh test_mm512_mulne_pbh(__m512bh __A, __m512bh __B) {
- // CHECK-LABEL: @test_mm512_mulne_pbh
+__m512bh test_mm512_mul_pbh(__m512bh __A, __m512bh __B) {
+ // CHECK-LABEL: @test_mm512_mul_pbh
// CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}}
- return _mm512_mulne_pbh(__A, __B);
+ return _mm512_mul_pbh(__A, __B);
}
-__m512bh test_mm512_mask_mulne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_mask_mul_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_mulne_pbh(__W, __U, __A, __B);
+ return _mm512_mask_mul_pbh(__W, __U, __A, __B);
}
-__m512bh test_mm512_maskz_mulne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_maskz_mul_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_mulne_pbh(__U, __A, __B);
+ return _mm512_maskz_mul_pbh(__U, __A, __B);
}
-__m512bh test_mm512_divne_pbh(__m512bh __A, __m512bh __B) {
- // CHECK-LABEL: @test_mm512_divne_pbh
+__m512bh test_mm512_div_pbh(__m512bh __A, __m512bh __B) {
+ // CHECK-LABEL: @test_mm512_div_pbh
// CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}}
- return _mm512_divne_pbh(__A, __B);
+ return _mm512_div_pbh(__A, __B);
}
-__m512bh test_mm512_mask_divne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_mask_div_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_divne_pbh(__W, __U, __A, __B);
+ return _mm512_mask_div_pbh(__W, __U, __A, __B);
}
-__m512bh test_mm512_maskz_divne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
+__m512bh test_mm512_maskz_div_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_divne_pbh(__U, __A, __B);
+ return _mm512_maskz_div_pbh(__U, __A, __B);
}
__m512bh test_mm512_max_pbh(__m512bh __A, __m512bh __B) {
// CHECK-LABEL: @test_mm512_max_pbh
- // CHECK: @llvm.x86.avx10.vmaxpbf16512(
+ // CHECK: @llvm.x86.avx10.vmaxbf16512(
return _mm512_max_pbh(__A, __B);
}
__m512bh test_mm512_mask_max_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16512
+ // CHECK: @llvm.x86.avx10.vmaxbf16512
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
return _mm512_mask_max_pbh(__W, __U, __A, __B);
}
__m512bh test_mm512_maskz_max_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16512
+ // CHECK: @llvm.x86.avx10.vmaxbf16512
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
return _mm512_maskz_max_pbh(__U, __A, __B);
}
__m512bh test_mm512_min_pbh(__m512bh __A, __m512bh __B) {
// CHECK-LABEL: @test_mm512_min_pbh
- // CHECK: @llvm.x86.avx10.vminpbf16512(
+ // CHECK: @llvm.x86.avx10.vminbf16512(
return _mm512_min_pbh(__A, __B);
}
__m512bh test_mm512_mask_min_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16512
+ // CHECK: @llvm.x86.avx10.vminbf16512
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
return _mm512_mask_min_pbh(__W, __U, __A, __B);
}
__m512bh test_mm512_maskz_min_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16512
+ // CHECK: @llvm.x86.avx10.vminbf16512
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
return _mm512_maskz_min_pbh(__U, __A, __B);
}
@@ -802,139 +802,139 @@ __mmask32 test_mm512_mask_cmp_pbh_mask_true_us(__mmask32 m, __m512bh a, __m512bh
__mmask32 test_mm512_mask_fpclass_pbh_mask(__mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_mask_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.512
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.512
return _mm512_mask_fpclass_pbh_mask(__U, __A, 4);
}
__mmask32 test_mm512_fpclass_pbh_mask(__m512bh __A) {
// CHECK-LABEL: @test_mm512_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.512
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.512
return _mm512_fpclass_pbh_mask(__A, 4);
}
__m512bh test_mm512_scalef_pbh(__m512bh __A, __m512bh __B) {
// CHECK-LABEL: @test_mm512_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512
return _mm512_scalef_pbh(__A, __B);
}
__m512bh test_mm512_mask_scalef_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK-LABEL: @test_mm512_mask_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512
return _mm512_mask_scalef_pbh(__W, __U, __A, __B);
}
__m512bh test_mm512_maskz_scalef_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) {
// CHECK-LABEL: @test_mm512_maskz_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512
return _mm512_maskz_scalef_pbh(__U, __A, __B);
}
__m512bh test_mm512_rcp_pbh(__m512bh __A) {
// CHECK-LABEL: @test_mm512_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512
return _mm512_rcp_pbh(__A);
}
__m512bh test_mm512_mask_rcp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_mask_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512
return (__m512bh)_mm512_mask_rcp_pbh(__W, __U, __A);
}
__m512bh test_mm512_maskz_rcp_pbh(__mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_maskz_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512
return _mm512_maskz_rcp_pbh(__U, __A);
}
__m512bh test_mm512_getexp_pbh(__m512bh __A) {
// CHECK-LABEL: @test_mm512_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512
return _mm512_getexp_pbh(__A);
}
__m512bh test_mm512_mask_getexp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_mask_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512
return _mm512_mask_getexp_pbh(__W, __U, __A);
}
__m512bh test_mm512_maskz_getexp_pbh(__mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_maskz_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512
return _mm512_maskz_getexp_pbh(__U, __A);
}
__m512bh test_mm512_rsqrt_pbh(__m512bh __A) {
// CHECK-LABEL: @test_mm512_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512
return _mm512_rsqrt_pbh(__A);
}
__m512bh test_mm512_mask_rsqrt_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_mask_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512
return (__m512bh)_mm512_mask_rsqrt_pbh(__W, __U, __A);
}
__m512bh test_mm512_maskz_rsqrt_pbh(__mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_maskz_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512
return _mm512_maskz_rsqrt_pbh(__U, __A);
}
-__m512bh test_mm512_reducene_pbh(__m512bh __A) {
- // CHECK-LABEL: @test_mm512_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512
- return _mm512_reducene_pbh(__A, 3);
+__m512bh test_mm512_reduce_pbh(__m512bh __A) {
+ // CHECK-LABEL: @test_mm512_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512
+ return _mm512_reduce_pbh(__A, 3);
}
-__m512bh test_mm512_mask_reducene_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) {
- // CHECK-LABEL: @test_mm512_mask_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512
- return _mm512_mask_reducene_pbh(__W, __U, __A, 1);
+__m512bh test_mm512_mask_reduce_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) {
+ // CHECK-LABEL: @test_mm512_mask_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512
+ return _mm512_mask_reduce_pbh(__W, __U, __A, 1);
}
-__m512bh test_mm512_maskz_reducene_pbh(__mmask16 __U, __m512bh __A) {
- // CHECK-LABEL: @test_mm512_maskz_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512
- return _mm512_maskz_reducene_pbh(__U, __A, 1);
+__m512bh test_mm512_maskz_reduce_pbh(__mmask16 __U, __m512bh __A) {
+ // CHECK-LABEL: @test_mm512_maskz_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512
+ return _mm512_maskz_reduce_pbh(__U, __A, 1);
}
-__m512bh test_mm512_roundscalene_pbh(__m512bh __A) {
- // CHECK-LABEL: @test_mm512_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512
- return _mm512_roundscalene_pbh(__A, 3);
+__m512bh test_mm512_roundscale_pbh(__m512bh __A) {
+ // CHECK-LABEL: @test_mm512_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512
+ return _mm512_roundscale_pbh(__A, 3);
}
-__m512bh test_mm512_mask_roundscalene_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) {
- // CHECK-LABEL: @test_mm512_mask_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512
- return _mm512_mask_roundscalene_pbh(__W, __U, __A, 1);
+__m512bh test_mm512_mask_roundscale_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) {
+ // CHECK-LABEL: @test_mm512_mask_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512
+ return _mm512_mask_roundscale_pbh(__W, __U, __A, 1);
}
-__m512bh test_mm512_maskz_roundscalene_pbh(__mmask16 __U, __m512bh __A) {
- // CHECK-LABEL: @test_mm512_maskz_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512
- return _mm512_maskz_roundscalene_pbh(__U, __A, 1 );
+__m512bh test_mm512_maskz_roundscale_pbh(__mmask16 __U, __m512bh __A) {
+ // CHECK-LABEL: @test_mm512_maskz_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512
+ return _mm512_maskz_roundscale_pbh(__U, __A, 1 );
}
__m512bh test_mm512_getmant_pbh(__m512bh __A) {
// CHECK-LABEL: @test_mm512_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512
return _mm512_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m512bh test_mm512_mask_getmant_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_mask_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512
return _mm512_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m512bh test_mm512_maskz_getmant_pbh(__mmask32 __U, __m512bh __A) {
// CHECK-LABEL: @test_mm512_maskz_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512
return _mm512_maskz_getmant_pbh(__U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
@@ -960,126 +960,126 @@ __m512bh test_mm512_maskz_sqrt_pbh(__mmask32 __U, __m512bh __A) {
return _mm512_maskz_sqrt_pbh(__U, __A);
}
-__m512bh test_mm512_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_fmaddne_pbh
+__m512bh test_mm512_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_fmadd_pbh
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
- return _mm512_fmaddne_pbh(__A, __B, __C);
+ return _mm512_fmadd_pbh(__A, __B, __C);
}
-__m512bh test_mm512_mask_fmaddne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_mask_fmaddne_pbh
+__m512bh test_mm512_mask_fmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_mask_fmadd_pbh
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_fmaddne_pbh(__A, __U, __B, __C);
+ return _mm512_mask_fmadd_pbh(__A, __U, __B, __C);
}
-__m512bh test_mm512_mask3_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
- // CHECK-LABEL: @test_mm512_mask3_fmaddne_pbh
+__m512bh test_mm512_mask3_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
+ // CHECK-LABEL: @test_mm512_mask3_fmadd_pbh
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask3_fmaddne_pbh(__A, __B, __C, __U);
+ return _mm512_mask3_fmadd_pbh(__A, __B, __C, __U);
}
-__m512bh test_mm512_maskz_fmaddne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_maskz_fmaddne_pbh
+__m512bh test_mm512_maskz_fmadd_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_maskz_fmadd_pbh
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_fmaddne_pbh(__U, __A, __B, __C);
+ return _mm512_maskz_fmadd_pbh(__U, __A, __B, __C);
}
-__m512bh test_mm512_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_fmsubne_pbh
+__m512bh test_mm512_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_fmsub_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
- return _mm512_fmsubne_pbh(__A, __B, __C);
+ return _mm512_fmsub_pbh(__A, __B, __C);
}
-__m512bh test_mm512_mask_fmsubne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_mask_fmsubne_pbh
+__m512bh test_mm512_mask_fmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_mask_fmsub_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_fmsubne_pbh(__A, __U, __B, __C);
+ return _mm512_mask_fmsub_pbh(__A, __U, __B, __C);
}
-__m512bh test_mm512_mask3_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
- // CHECK-LABEL: @test_mm512_mask3_fmsubne_pbh
+__m512bh test_mm512_mask3_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
+ // CHECK-LABEL: @test_mm512_mask3_fmsub_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask3_fmsubne_pbh(__A, __B, __C, __U);
+ return _mm512_mask3_fmsub_pbh(__A, __B, __C, __U);
}
-__m512bh test_mm512_maskz_fmsubne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_maskz_fmsubne_pbh
+__m512bh test_mm512_maskz_fmsub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_maskz_fmsub_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_fmsubne_pbh(__U, __A, __B, __C);
+ return _mm512_maskz_fmsub_pbh(__U, __A, __B, __C);
}
-__m512bh test_mm512_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_fnmaddne_pbh
+__m512bh test_mm512_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_fnmadd_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
- return _mm512_fnmaddne_pbh(__A, __B, __C);
+ return _mm512_fnmadd_pbh(__A, __B, __C);
}
-__m512bh test_mm512_mask_fnmaddne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_mask_fnmaddne_pbh
+__m512bh test_mm512_mask_fnmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_mask_fnmadd_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_fnmaddne_pbh(__A, __U, __B, __C);
+ return _mm512_mask_fnmadd_pbh(__A, __U, __B, __C);
}
-__m512bh test_mm512_mask3_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
- // CHECK-LABEL: @test_mm512_mask3_fnmaddne_pbh
+__m512bh test_mm512_mask3_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
+ // CHECK-LABEL: @test_mm512_mask3_fnmadd_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask3_fnmaddne_pbh(__A, __B, __C, __U);
+ return _mm512_mask3_fnmadd_pbh(__A, __B, __C, __U);
}
-__m512bh test_mm512_maskz_fnmaddne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_maskz_fnmaddne_pbh
+__m512bh test_mm512_maskz_fnmadd_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_maskz_fnmadd_pbh
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_fnmaddne_pbh(__U, __A, __B, __C);
+ return _mm512_maskz_fnmadd_pbh(__U, __A, __B, __C);
}
-__m512bh test_mm512_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_fnmsubne_pbh
+__m512bh test_mm512_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
- return _mm512_fnmsubne_pbh(__A, __B, __C);
+ return _mm512_fnmsub_pbh(__A, __B, __C);
}
-__m512bh test_mm512_mask_fnmsubne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_mask_fnmsubne_pbh
+__m512bh test_mm512_mask_fnmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_mask_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask_fnmsubne_pbh(__A, __U, __B, __C);
+ return _mm512_mask_fnmsub_pbh(__A, __U, __B, __C);
}
-__m512bh test_mm512_mask3_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
- // CHECK-LABEL: @test_mm512_mask3_fnmsubne_pbh
+__m512bh test_mm512_mask3_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) {
+ // CHECK-LABEL: @test_mm512_mask3_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_mask3_fnmsubne_pbh(__A, __B, __C, __U);
+ return _mm512_mask3_fnmsub_pbh(__A, __B, __C, __U);
}
-__m512bh test_mm512_maskz_fnmsubne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
- // CHECK-LABEL: @test_mm512_maskz_fnmsubne_pbh
+__m512bh test_mm512_maskz_fnmsub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) {
+ // CHECK-LABEL: @test_mm512_maskz_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}})
// CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}
- return _mm512_maskz_fnmsubne_pbh(__U, __A, __B, __C);
+ return _mm512_maskz_fnmsub_pbh(__U, __A, __B, __C);
}
diff --git a/clang/test/CodeGen/X86/avx10_2bf16-builtins.c b/clang/test/CodeGen/X86/avx10_2bf16-builtins.c
index 9935137ca86775..931381af5df759 100644
--- a/clang/test/CodeGen/X86/avx10_2bf16-builtins.c
+++ b/clang/test/CodeGen/X86/avx10_2bf16-builtins.c
@@ -164,28 +164,28 @@ __m256bh test_mm256_setr_pbh(__bf16 bf1, __bf16 bf2, __bf16 bf3, __bf16 bf4,
bf9, bf10, bf11, bf12, bf13, bf14, bf15, bf16);
}
-__m128 test_mm_castpbf16_ps(__m128bh A) {
- // CHECK-LABEL: test_mm_castpbf16_ps
+__m128 test_mm_castbf16_ps(__m128bh A) {
+ // CHECK-LABEL: test_mm_castbf16_ps
// CHECK: bitcast <8 x bfloat> %{{.*}} to <4 x float>
- return _mm_castpbf16_ps(A);
+ return _mm_castbf16_ps(A);
}
-__m256 test_mm256_castpbf16_ps(__m256bh A) {
- // CHECK-LABEL: test_mm256_castpbf16_ps
+__m256 test_mm256_castbf16_ps(__m256bh A) {
+ // CHECK-LABEL: test_mm256_castbf16_ps
// CHECK: bitcast <16 x bfloat> %{{.*}} to <8 x float>
- return _mm256_castpbf16_ps(A);
+ return _mm256_castbf16_ps(A);
}
-__m128i test_mm_castpbf16_si128(__m128bh A) {
- // CHECK-LABEL: test_mm_castpbf16_si128
+__m128i test_mm_castbf16_si128(__m128bh A) {
+ // CHECK-LABEL: test_mm_castbf16_si128
// CHECK: bitcast <8 x bfloat> %{{.*}} to <2 x i64>
- return _mm_castpbf16_si128(A);
+ return _mm_castbf16_si128(A);
}
-__m256i test_mm256_castpbf16_si256(__m256bh A) {
- // CHECK-LABEL: test_mm256_castpbf16_si256
+__m256i test_mm256_castbf16_si256(__m256bh A) {
+ // CHECK-LABEL: test_mm256_castbf16_si256
// CHECK: bitcast <16 x bfloat> %{{.*}} to <4 x i64>
- return _mm256_castpbf16_si256(A);
+ return _mm256_castbf16_si256(A);
}
__m128bh test_mm_castps_pbh(__m128 A) {
@@ -224,34 +224,34 @@ __m256bh test_mm256_castsi256_pbh(__m256i A) {
return _mm256_castsi256_pbh(A);
}
-__m128d test_mm_castpbf16_pd(__m128bh A) {
- // CHECK-LABEL: test_mm_castpbf16_pd
+__m128d test_mm_castbf16_pd(__m128bh A) {
+ // CHECK-LABEL: test_mm_castbf16_pd
// CHECK: bitcast <8 x bfloat> %{{.*}} to <2 x double>
- return _mm_castpbf16_pd(A);
+ return _mm_castbf16_pd(A);
}
-__m128bh test_mm256_castpbf16256_pbh128(__m256bh __a) {
- // CHECK-LABEL: test_mm256_castpbf16256_pbh128
+__m128bh test_mm256_castbf16256_pbh128(__m256bh __a) {
+ // CHECK-LABEL: test_mm256_castbf16256_pbh128
// CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
- return _mm256_castpbf16256_pbh128(__a);
+ return _mm256_castbf16256_pbh128(__a);
}
-__m256bh test_mm256_castpbf16128_pbh256(__m128bh __a) {
- // CHECK-LABEL: test_mm256_castpbf16128_pbh256
+__m256bh test_mm256_castbf16128_pbh256(__m128bh __a) {
+ // CHECK-LABEL: test_mm256_castbf16128_pbh256
// CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison>
- return _mm256_castpbf16128_pbh256(__a);
+ return _mm256_castbf16128_pbh256(__a);
}
-__m256d test_mm256_castpbf16_pd(__m256bh A) {
- // CHECK-LABEL: test_mm256_castpbf16_pd
+__m256d test_mm256_castbf16_pd(__m256bh A) {
+ // CHECK-LABEL: test_mm256_castbf16_pd
// CHECK: bitcast <16 x bfloat> %{{.*}} to <4 x double>
- return _mm256_castpbf16_pd(A);
+ return _mm256_castbf16_pd(A);
}
-__m256bh test_mm256_zextpbf16128_pbh256(__m128bh __a) {
- // CHECK-LABEL: test_mm256_zextpbf16128_pbh256
+__m256bh test_mm256_zextbf16128_pbh256(__m128bh __a) {
+ // CHECK-LABEL: test_mm256_zextbf16128_pbh256
// CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> {{.*}}, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
- return _mm256_zextpbf16128_pbh256(__a);
+ return _mm256_zextbf16128_pbh256(__a);
}
__m128bh test_mm_abs_pbh(__m128bh a) {
@@ -432,218 +432,218 @@ __m256bh test_mm256_permutexvar_pbh(__m256i __A, __m256bh __B) {
return _mm256_permutexvar_pbh(__A, __B);
}
-__m256bh test_mm256_addne_pbh(__m256bh __A, __m256bh __B) {
- // CHECK-LABEL: @test_mm256_addne_pbh
+__m256bh test_mm256_add_pbh(__m256bh __A, __m256bh __B) {
+ // CHECK-LABEL: @test_mm256_add_pbh
// CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}}
- return _mm256_addne_pbh(__A, __B);
+ return _mm256_add_pbh(__A, __B);
}
-__m256bh test_mm256_mask_addne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_mask_add_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return (__m256bh)_mm256_mask_addne_pbh(__W, __U, __A, __B);
+ return (__m256bh)_mm256_mask_add_pbh(__W, __U, __A, __B);
}
-__m256bh test_mm256_maskz_addne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_maskz_add_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_addne_pbh(__U, __A, __B);
+ return _mm256_maskz_add_pbh(__U, __A, __B);
}
-__m128bh test_mm_addne_pbh(__m128bh __A, __m128bh __B) {
- // CHECK-LABEL: @test_mm_addne_pbh
+__m128bh test_mm_add_pbh(__m128bh __A, __m128bh __B) {
+ // CHECK-LABEL: @test_mm_add_pbh
// CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}}
- return _mm_addne_pbh(__A, __B);
+ return _mm_add_pbh(__A, __B);
}
-__m128bh test_mm_mask_addne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_mask_add_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return (__m128bh)_mm_mask_addne_pbh(__W, __U, __A, __B);
+ return (__m128bh)_mm_mask_add_pbh(__W, __U, __A, __B);
}
-__m128bh test_mm_maskz_addne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_maskz_add_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_addne_pbh(__U, __A, __B);
+ return _mm_maskz_add_pbh(__U, __A, __B);
}
-__m256bh test_mm256_subne_pbh(__m256bh __A, __m256bh __B) {
- // CHECK-LABEL: @test_mm256_subne_pbh
+__m256bh test_mm256_sub_pbh(__m256bh __A, __m256bh __B) {
+ // CHECK-LABEL: @test_mm256_sub_pbh
// CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}}
- return _mm256_subne_pbh(__A, __B);
+ return _mm256_sub_pbh(__A, __B);
}
-__m256bh test_mm256_mask_subne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_mask_sub_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return (__m256bh)_mm256_mask_subne_pbh(__W, __U, __A, __B);
+ return (__m256bh)_mm256_mask_sub_pbh(__W, __U, __A, __B);
}
-__m256bh test_mm256_maskz_subne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_maskz_sub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_subne_pbh(__U, __A, __B);
+ return _mm256_maskz_sub_pbh(__U, __A, __B);
}
-__m128bh test_mm_subne_pbh(__m128bh __A, __m128bh __B) {
- // CHECK-LABEL: @test_mm_subne_pbh
+__m128bh test_mm_sub_pbh(__m128bh __A, __m128bh __B) {
+ // CHECK-LABEL: @test_mm_sub_pbh
// CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, %{{.*}}
- return _mm_subne_pbh(__A, __B);
+ return _mm_sub_pbh(__A, __B);
}
-__m128bh test_mm_mask_subne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_mask_sub_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return (__m128bh)_mm_mask_subne_pbh(__W, __U, __A, __B);
+ return (__m128bh)_mm_mask_sub_pbh(__W, __U, __A, __B);
}
-__m128bh test_mm_maskz_subne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_maskz_sub_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_subne_pbh(__U, __A, __B);
+ return _mm_maskz_sub_pbh(__U, __A, __B);
}
-__m256bh test_mm256_mulne_pbh(__m256bh __A, __m256bh __B) {
- // CHECK-LABEL: @test_mm256_mulne_pbh
+__m256bh test_mm256_mul_pbh(__m256bh __A, __m256bh __B) {
+ // CHECK-LABEL: @test_mm256_mul_pbh
// CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}}
- return _mm256_mulne_pbh(__A, __B);
+ return _mm256_mul_pbh(__A, __B);
}
-__m256bh test_mm256_mask_mulne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_mask_mul_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return (__m256bh)_mm256_mask_mulne_pbh(__W, __U, __A, __B);
+ return (__m256bh)_mm256_mask_mul_pbh(__W, __U, __A, __B);
}
-__m256bh test_mm256_maskz_mulne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_maskz_mul_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_mulne_pbh(__U, __A, __B);
+ return _mm256_maskz_mul_pbh(__U, __A, __B);
}
-__m128bh test_mm_mulne_pbh(__m128bh __A, __m128bh __B) {
- // CHECK-LABEL: @test_mm_mulne_pbh
+__m128bh test_mm_mul_pbh(__m128bh __A, __m128bh __B) {
+ // CHECK-LABEL: @test_mm_mul_pbh
// CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}}
- return _mm_mulne_pbh(__A, __B);
+ return _mm_mul_pbh(__A, __B);
}
-__m128bh test_mm_mask_mulne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_mask_mul_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return (__m128bh)_mm_mask_mulne_pbh(__W, __U, __A, __B);
+ return (__m128bh)_mm_mask_mul_pbh(__W, __U, __A, __B);
}
-__m128bh test_mm_maskz_mulne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_maskz_mul_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_mulne_pbh(__U, __A, __B);
+ return _mm_maskz_mul_pbh(__U, __A, __B);
}
-__m256bh test_mm256_divne_pbh(__m256bh __A, __m256bh __B) {
- // CHECK-LABEL: @test_mm256_divne_pbh
+__m256bh test_mm256_div_pbh(__m256bh __A, __m256bh __B) {
+ // CHECK-LABEL: @test_mm256_div_pbh
// CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}}
- return _mm256_divne_pbh(__A, __B);
+ return _mm256_div_pbh(__A, __B);
}
-__m256bh test_mm256_mask_divne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_mask_div_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return (__m256bh)_mm256_mask_divne_pbh(__W, __U, __A, __B);
+ return (__m256bh)_mm256_mask_div_pbh(__W, __U, __A, __B);
}
-__m256bh test_mm256_maskz_divne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
+__m256bh test_mm256_maskz_div_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_divne_pbh(__U, __A, __B);
+ return _mm256_maskz_div_pbh(__U, __A, __B);
}
-__m128bh test_mm_divne_pbh(__m128bh __A, __m128bh __B) {
- // CHECK-LABEL: @test_mm_divne_pbh
+__m128bh test_mm_div_pbh(__m128bh __A, __m128bh __B) {
+ // CHECK-LABEL: @test_mm_div_pbh
// CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}}
- return _mm_divne_pbh(__A, __B);
+ return _mm_div_pbh(__A, __B);
}
-__m128bh test_mm_mask_divne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_mask_div_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return (__m128bh)_mm_mask_divne_pbh(__W, __U, __A, __B);
+ return (__m128bh)_mm_mask_div_pbh(__W, __U, __A, __B);
}
-__m128bh test_mm_maskz_divne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
+__m128bh test_mm_maskz_div_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
// CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}}
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_divne_pbh(__U, __A, __B);
+ return _mm_maskz_div_pbh(__U, __A, __B);
}
__m256bh test_mm256_max_pbh(__m256bh __A, __m256bh __B) {
// CHECK-LABEL: @test_mm256_max_pbh
- // CHECK: @llvm.x86.avx10.vmaxpbf16256(
+ // CHECK: @llvm.x86.avx10.vmaxbf16256(
return _mm256_max_pbh(__A, __B);
}
__m256bh test_mm256_mask_max_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16256
+ // CHECK: @llvm.x86.avx10.vmaxbf16256
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
return (__m256bh)_mm256_mask_max_pbh(__W, __U, __A, __B);
}
__m256bh test_mm256_maskz_max_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16256
+ // CHECK: @llvm.x86.avx10.vmaxbf16256
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
return _mm256_maskz_max_pbh(__U, __A, __B);
}
__m128bh test_mm_max_pbh(__m128bh __A, __m128bh __B) {
// CHECK-LABEL: @test_mm_max_pbh
- // CHECK: @llvm.x86.avx10.vmaxpbf16128(
+ // CHECK: @llvm.x86.avx10.vmaxbf16128(
return _mm_max_pbh(__A, __B);
}
__m128bh test_mm_mask_max_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16128
+ // CHECK: @llvm.x86.avx10.vmaxbf16128
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
return (__m128bh)_mm_mask_max_pbh(__W, __U, __A, __B);
}
__m128bh test_mm_maskz_max_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
- // CHECK: @llvm.x86.avx10.vmaxpbf16128
+ // CHECK: @llvm.x86.avx10.vmaxbf16128
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
return _mm_maskz_max_pbh(__U, __A, __B);
}
__m256bh test_mm256_min_pbh(__m256bh __A, __m256bh __B) {
// CHECK-LABEL: @test_mm256_min_pbh
- // CHECK: @llvm.x86.avx10.vminpbf16256(
+ // CHECK: @llvm.x86.avx10.vminbf16256(
return _mm256_min_pbh(__A, __B);
}
__m256bh test_mm256_mask_min_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16256
+ // CHECK: @llvm.x86.avx10.vminbf16256
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
return (__m256bh)_mm256_mask_min_pbh(__W, __U, __A, __B);
}
__m256bh test_mm256_maskz_min_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16256
+ // CHECK: @llvm.x86.avx10.vminbf16256
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
return _mm256_maskz_min_pbh(__U, __A, __B);
}
__m128bh test_mm_min_pbh(__m128bh __A, __m128bh __B) {
// CHECK-LABEL: @test_mm_min_pbh
- // CHECK: @llvm.x86.avx10.vminpbf16128(
+ // CHECK: @llvm.x86.avx10.vminbf16128(
return _mm_min_pbh(__A, __B);
}
__m128bh test_mm_mask_min_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16128
+ // CHECK: @llvm.x86.avx10.vminbf16128
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
return (__m128bh)_mm_mask_min_pbh(__W, __U, __A, __B);
}
__m128bh test_mm_maskz_min_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) {
- // CHECK: @llvm.x86.avx10.vminpbf16128
+ // CHECK: @llvm.x86.avx10.vminbf16128
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
return _mm_maskz_min_pbh(__U, __A, __B);
}
@@ -1519,151 +1519,151 @@ __mmask8 test_mm_mask_cmp_pbh_mask_true_us(__mmask8 m, __m128bh a, __m128bh b) {
__mmask16 test_mm256_mask_fpclass_pbh_mask(__mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_mask_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.256
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.256
return _mm256_mask_fpclass_pbh_mask(__U, __A, 4);
}
__mmask16 test_mm256_fpclass_pbh_mask(__m256bh __A) {
// CHECK-LABEL: @test_mm256_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.256
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.256
return _mm256_fpclass_pbh_mask(__A, 4);
}
__mmask8 test_mm_mask_fpclass_pbh_mask(__mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_mask_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.128
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.128
return _mm_mask_fpclass_pbh_mask(__U, __A, 4);
}
__mmask8 test_mm_fpclass_pbh_mask(__m128bh __A) {
// CHECK-LABEL: @test_mm_fpclass_pbh_mask
- // CHECK: @llvm.x86.avx10.fpclass.nepbf16.128
+ // CHECK: @llvm.x86.avx10.fpclass.bf16.128
return _mm_fpclass_pbh_mask(__A, 4);
}
__m256bh test_mm256_scalef_pbh(__m256bh __A, __m256bh __B) {
// CHECK-LABEL: @test_mm256_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256
return _mm256_scalef_pbh(__A, __B);
}
__m256bh test_mm256_mask_scalef_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK-LABEL: @test_mm256_mask_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256
return _mm256_mask_scalef_pbh(__W, __U, __A, __B);
}
__m256bh test_mm256_maskz_scalef_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) {
// CHECK-LABEL: @test_mm256_maskz_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256
return _mm256_maskz_scalef_pbh(__U, __A, __B);
}
__m256bh test_mm256_rcp_pbh(__m256bh __A) {
// CHECK-LABEL: @test_mm256_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256
return _mm256_rcp_pbh(__A);
}
__m256bh test_mm256_mask_rcp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_mask_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256
return (__m256bh)_mm256_mask_rcp_pbh(__W, __U, __A);
}
__m256bh test_mm256_maskz_rcp_pbh(__mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_maskz_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256
return _mm256_maskz_rcp_pbh(__U, __A);
}
__m256bh test_mm256_getexp_pbh(__m256bh __A) {
// CHECK-LABEL: @test_mm256_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256
return _mm256_getexp_pbh(__A);
}
__m256bh test_mm256_mask_getexp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_mask_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256
return _mm256_mask_getexp_pbh(__W, __U, __A);
}
__m256bh test_mm256_maskz_getexp_pbh(__mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_maskz_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256
return _mm256_maskz_getexp_pbh(__U, __A);
}
__m256bh test_mm256_rsqrt_pbh(__m256bh __A) {
// CHECK-LABEL: @test_mm256_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256
return _mm256_rsqrt_pbh(__A);
}
__m256bh test_mm256_mask_rsqrt_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_mask_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256
return (__m256bh)_mm256_mask_rsqrt_pbh(__W, __U, __A);
}
__m256bh test_mm256_maskz_rsqrt_pbh(__mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_maskz_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256
return _mm256_maskz_rsqrt_pbh(__U, __A);
}
-__m256bh test_mm256_reducene_pbh(__m256bh __A) {
- // CHECK-LABEL: @test_mm256_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256
- return _mm256_reducene_pbh(__A, 3);
+__m256bh test_mm256_reduce_pbh(__m256bh __A) {
+ // CHECK-LABEL: @test_mm256_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256
+ return _mm256_reduce_pbh(__A, 3);
}
-__m256bh test_mm256_mask_reducene_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
- // CHECK-LABEL: @test_mm256_mask_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256
- return _mm256_mask_reducene_pbh(__W, __U, __A, 1);
+__m256bh test_mm256_mask_reduce_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
+ // CHECK-LABEL: @test_mm256_mask_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256
+ return _mm256_mask_reduce_pbh(__W, __U, __A, 1);
}
-__m256bh test_mm256_maskz_reducene_pbh(__mmask16 __U, __m256bh __A) {
- // CHECK-LABEL: @test_mm256_maskz_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256
- return _mm256_maskz_reducene_pbh(__U, __A, 1);
+__m256bh test_mm256_maskz_reduce_pbh(__mmask16 __U, __m256bh __A) {
+ // CHECK-LABEL: @test_mm256_maskz_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256
+ return _mm256_maskz_reduce_pbh(__U, __A, 1);
}
-__m256bh test_mm256_roundscalene_pbh(__m256bh __A) {
- // CHECK-LABEL: @test_mm256_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256
- return _mm256_roundscalene_pbh(__A, 3);
+__m256bh test_mm256_roundscale_pbh(__m256bh __A) {
+ // CHECK-LABEL: @test_mm256_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256
+ return _mm256_roundscale_pbh(__A, 3);
}
-__m256bh test_mm256_mask_roundscalene_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
- // CHECK-LABEL: @test_mm256_mask_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256
- return _mm256_mask_roundscalene_pbh(__W, __U, __A, 1);
+__m256bh test_mm256_mask_roundscale_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
+ // CHECK-LABEL: @test_mm256_mask_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256
+ return _mm256_mask_roundscale_pbh(__W, __U, __A, 1);
}
-__m256bh test_mm256_maskz_roundscalene_pbh(__mmask16 __U, __m256bh __A) {
- // CHECK-LABEL: @test_mm256_maskz_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256
- return _mm256_maskz_roundscalene_pbh(__U, __A, 1 );
+__m256bh test_mm256_maskz_roundscale_pbh(__mmask16 __U, __m256bh __A) {
+ // CHECK-LABEL: @test_mm256_maskz_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256
+ return _mm256_maskz_roundscale_pbh(__U, __A, 1 );
}
__m256bh test_mm256_getmant_pbh(__m256bh __A) {
// CHECK-LABEL: @test_mm256_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256
return _mm256_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m256bh test_mm256_mask_getmant_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_mask_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256
return _mm256_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m256bh test_mm256_maskz_getmant_pbh(__mmask16 __U, __m256bh __A) {
// CHECK-LABEL: @test_mm256_maskz_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256
return _mm256_maskz_getmant_pbh(__U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
@@ -1689,127 +1689,127 @@ __m256bh test_mm256_maskz_sqrt_pbh(__mmask16 __U, __m256bh __A) {
__m128bh test_mm_scalef_pbh(__m128bh __A, __m128bh __B) {
// CHECK-LABEL: @test_mm_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128
return _mm_scalef_pbh(__A, __B);
}
__m128bh test_mm_mask_scalef_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) {
// CHECK-LABEL: @test_mm_mask_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128
return _mm_mask_scalef_pbh(__W, __U, __A, __B);
}
__m128bh test_mm_maskz_scalef_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) {
// CHECK-LABEL: @test_mm_maskz_scalef_pbh
- // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128
return _mm_maskz_scalef_pbh(__U, __A, __B);
}
__m128bh test_mm_rcp_pbh(__m128bh __A) {
// CHECK-LABEL: @test_mm_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128
return _mm_rcp_pbh(__A);
}
__m128bh test_mm_mask_rcp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_mask_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128
return (__m128bh)_mm_mask_rcp_pbh(__W, __U, __A);
}
__m128bh test_mm_maskz_rcp_pbh(__mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_maskz_rcp_pbh
- // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128
return _mm_maskz_rcp_pbh(__U, __A);
}
__m128bh test_mm_getexp_pbh(__m128bh __A) {
// CHECK-LABEL: @test_mm_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.128
return _mm_getexp_pbh(__A);
}
__m128bh test_mm_mask_getexp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_mask_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.128
return _mm_mask_getexp_pbh(__W, __U, __A);
}
__m128bh test_mm_maskz_getexp_pbh(__mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_maskz_getexp_pbh
- // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getexp.bf16.128
return _mm_maskz_getexp_pbh(__U, __A);
}
__m128bh test_mm_rsqrt_pbh(__m128bh __A) {
// CHECK-LABEL: @test_mm_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128
return _mm_rsqrt_pbh(__A);
}
__m128bh test_mm_mask_rsqrt_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_mask_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128
return (__m128bh)_mm_mask_rsqrt_pbh(__W, __U, __A);
}
__m128bh test_mm_maskz_rsqrt_pbh(__mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_maskz_rsqrt_pbh
- // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128
return _mm_maskz_rsqrt_pbh(__U, __A);
}
-__m128bh test_mm_reducene_pbh(__m128bh __A) {
- // CHECK-LABEL: @test_mm_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.128
- return _mm_reducene_pbh(__A, 3);
+__m128bh test_mm_reduce_pbh(__m128bh __A) {
+ // CHECK-LABEL: @test_mm_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128
+ return _mm_reduce_pbh(__A, 3);
}
-__m128bh test_mm_mask_reducene_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
- // CHECK-LABEL: @test_mm_mask_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.128
- return _mm_mask_reducene_pbh(__W, __U, __A, 1);
+__m128bh test_mm_mask_reduce_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
+ // CHECK-LABEL: @test_mm_mask_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128
+ return _mm_mask_reduce_pbh(__W, __U, __A, 1);
}
-__m128bh test_mm_maskz_reducene_pbh(__mmask8 __U, __m128bh __A) {
- // CHECK-LABEL: @test_mm_maskz_reducene_pbh
- // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.128
- return _mm_maskz_reducene_pbh(__U, __A, 1);
+__m128bh test_mm_maskz_reduce_pbh(__mmask8 __U, __m128bh __A) {
+ // CHECK-LABEL: @test_mm_maskz_reduce_pbh
+ // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128
+ return _mm_maskz_reduce_pbh(__U, __A, 1);
}
-__m128bh test_mm_roundscalene_pbh(__m128bh __A) {
- // CHECK-LABEL: @test_mm_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128
- return _mm_roundscalene_pbh(__A, 3);
+__m128bh test_mm_roundscale_pbh(__m128bh __A) {
+ // CHECK-LABEL: @test_mm_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128
+ return _mm_roundscale_pbh(__A, 3);
}
-__m128bh test_mm_mask_roundscalene_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
- // CHECK-LABEL: @test_mm_mask_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128
- return _mm_mask_roundscalene_pbh(__W, __U, __A, 1);
+__m128bh test_mm_mask_roundscale_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
+ // CHECK-LABEL: @test_mm_mask_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128
+ return _mm_mask_roundscale_pbh(__W, __U, __A, 1);
}
-__m128bh test_mm_maskz_roundscalene_pbh(__mmask8 __U, __m128bh __A) {
- // CHECK-LABEL: @test_mm_maskz_roundscalene_pbh
- // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128
- return _mm_maskz_roundscalene_pbh(__U, __A, 1 );
+__m128bh test_mm_maskz_roundscale_pbh(__mmask8 __U, __m128bh __A) {
+ // CHECK-LABEL: @test_mm_maskz_roundscale_pbh
+ // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128
+ return _mm_maskz_roundscale_pbh(__U, __A, 1 );
}
__m128bh test_mm_getmant_pbh(__m128bh __A) {
// CHECK-LABEL: @test_mm_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128
return _mm_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m128bh test_mm_mask_getmant_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_mask_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128
return _mm_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
__m128bh test_mm_maskz_getmant_pbh(__mmask8 __U, __m128bh __A) {
// CHECK-LABEL: @test_mm_maskz_getmant_pbh
- // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.128
+ // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128
return _mm_maskz_getmant_pbh(__U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan);
}
@@ -1833,250 +1833,250 @@ __m128bh test_mm_maskz_sqrt_pbh(__mmask8 __U, __m128bh __A) {
return _mm_maskz_sqrt_pbh(__U, __A);
}
-__m256bh test_mm256_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_fmaddne_pbh
+__m256bh test_mm256_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_fmadd_pbh
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
- return _mm256_fmaddne_pbh(__A, __B, __C);
+ return _mm256_fmadd_pbh(__A, __B, __C);
}
-__m256bh test_mm256_mask_fmaddne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_mask_fmaddne_pbh
+__m256bh test_mm256_mask_fmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_mask_fmadd_pbh
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask_fmaddne_pbh(__A, __U, __B, __C);
+ return _mm256_mask_fmadd_pbh(__A, __U, __B, __C);
}
-__m256bh test_mm256_mask3_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
- // CHECK-LABEL: @test_mm256_mask3_fmaddne_pbh
+__m256bh test_mm256_mask3_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
+ // CHECK-LABEL: @test_mm256_mask3_fmadd_pbh
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask3_fmaddne_pbh(__A, __B, __C, __U);
+ return _mm256_mask3_fmadd_pbh(__A, __B, __C, __U);
}
-__m256bh test_mm256_maskz_fmaddne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_maskz_fmaddne_pbh
+__m256bh test_mm256_maskz_fmadd_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_maskz_fmadd_pbh
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_fmaddne_pbh(__U, __A, __B, __C);
+ return _mm256_maskz_fmadd_pbh(__U, __A, __B, __C);
}
-__m256bh test_mm256_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_fmsubne_pbh
+__m256bh test_mm256_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_fmsub_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
- return _mm256_fmsubne_pbh(__A, __B, __C);
+ return _mm256_fmsub_pbh(__A, __B, __C);
}
-__m256bh test_mm256_mask_fmsubne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_mask_fmsubne_pbh
+__m256bh test_mm256_mask_fmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_mask_fmsub_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask_fmsubne_pbh(__A, __U, __B, __C);
+ return _mm256_mask_fmsub_pbh(__A, __U, __B, __C);
}
-__m256bh test_mm256_mask3_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
- // CHECK-LABEL: @test_mm256_mask3_fmsubne_pbh
+__m256bh test_mm256_mask3_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
+ // CHECK-LABEL: @test_mm256_mask3_fmsub_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask3_fmsubne_pbh(__A, __B, __C, __U);
+ return _mm256_mask3_fmsub_pbh(__A, __B, __C, __U);
}
-__m256bh test_mm256_maskz_fmsubne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_maskz_fmsubne_pbh
+__m256bh test_mm256_maskz_fmsub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_maskz_fmsub_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_fmsubne_pbh(__U, __A, __B, __C);
+ return _mm256_maskz_fmsub_pbh(__U, __A, __B, __C);
}
-__m256bh test_mm256_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_fnmaddne_pbh
+__m256bh test_mm256_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_fnmadd_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
- return _mm256_fnmaddne_pbh(__A, __B, __C);
+ return _mm256_fnmadd_pbh(__A, __B, __C);
}
-__m256bh test_mm256_mask_fnmaddne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_mask_fnmaddne_pbh
+__m256bh test_mm256_mask_fnmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_mask_fnmadd_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask_fnmaddne_pbh(__A, __U, __B, __C);
+ return _mm256_mask_fnmadd_pbh(__A, __U, __B, __C);
}
-__m256bh test_mm256_mask3_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
- // CHECK-LABEL: @test_mm256_mask3_fnmaddne_pbh
+__m256bh test_mm256_mask3_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
+ // CHECK-LABEL: @test_mm256_mask3_fnmadd_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask3_fnmaddne_pbh(__A, __B, __C, __U);
+ return _mm256_mask3_fnmadd_pbh(__A, __B, __C, __U);
}
-__m256bh test_mm256_maskz_fnmaddne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_maskz_fnmaddne_pbh
+__m256bh test_mm256_maskz_fnmadd_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_maskz_fnmadd_pbh
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_fnmaddne_pbh(__U, __A, __B, __C);
+ return _mm256_maskz_fnmadd_pbh(__U, __A, __B, __C);
}
-__m256bh test_mm256_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_fnmsubne_pbh
+__m256bh test_mm256_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
- return _mm256_fnmsubne_pbh(__A, __B, __C);
+ return _mm256_fnmsub_pbh(__A, __B, __C);
}
-__m256bh test_mm256_mask_fnmsubne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_mask_fnmsubne_pbh
+__m256bh test_mm256_mask_fnmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_mask_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask_fnmsubne_pbh(__A, __U, __B, __C);
+ return _mm256_mask_fnmsub_pbh(__A, __U, __B, __C);
}
-__m256bh test_mm256_mask3_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
- // CHECK-LABEL: @test_mm256_mask3_fnmsubne_pbh
+__m256bh test_mm256_mask3_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) {
+ // CHECK-LABEL: @test_mm256_mask3_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_mask3_fnmsubne_pbh(__A, __B, __C, __U);
+ return _mm256_mask3_fnmsub_pbh(__A, __B, __C, __U);
}
-__m256bh test_mm256_maskz_fnmsubne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
- // CHECK-LABEL: @test_mm256_maskz_fnmsubne_pbh
+__m256bh test_mm256_maskz_fnmsub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) {
+ // CHECK-LABEL: @test_mm256_maskz_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}})
// CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}
- return _mm256_maskz_fnmsubne_pbh(__U, __A, __B, __C);
+ return _mm256_maskz_fnmsub_pbh(__U, __A, __B, __C);
}
-__m128bh test_mm_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_fmaddne_pbh
+__m128bh test_mm_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_fmadd_pbh
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
- return _mm_fmaddne_pbh(__A, __B, __C);
+ return _mm_fmadd_pbh(__A, __B, __C);
}
-__m128bh test_mm_mask_fmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_mask_fmaddne_pbh
+__m128bh test_mm_mask_fmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_mask_fmadd_pbh
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask_fmaddne_pbh(__A, __U, __B, __C);
+ return _mm_mask_fmadd_pbh(__A, __U, __B, __C);
}
-__m128bh test_mm_mask3_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
- // CHECK-LABEL: @test_mm_mask3_fmaddne_pbh
+__m128bh test_mm_mask3_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+ // CHECK-LABEL: @test_mm_mask3_fmadd_pbh
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask3_fmaddne_pbh(__A, __B, __C, __U);
+ return _mm_mask3_fmadd_pbh(__A, __B, __C, __U);
}
-__m128bh test_mm_maskz_fmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_maskz_fmaddne_pbh
+__m128bh test_mm_maskz_fmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_maskz_fmadd_pbh
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_fmaddne_pbh(__U, __A, __B, __C);
+ return _mm_maskz_fmadd_pbh(__U, __A, __B, __C);
}
-__m128bh test_mm_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_fmsubne_pbh
+__m128bh test_mm_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_fmsub_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
- return _mm_fmsubne_pbh(__A, __B, __C);
+ return _mm_fmsub_pbh(__A, __B, __C);
}
-__m128bh test_mm_mask_fmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_mask_fmsubne_pbh
+__m128bh test_mm_mask_fmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_mask_fmsub_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask_fmsubne_pbh(__A, __U, __B, __C);
+ return _mm_mask_fmsub_pbh(__A, __U, __B, __C);
}
-__m128bh test_mm_mask3_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
- // CHECK-LABEL: @test_mm_mask3_fmsubne_pbh
+__m128bh test_mm_mask3_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+ // CHECK-LABEL: @test_mm_mask3_fmsub_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask3_fmsubne_pbh(__A, __B, __C, __U);
+ return _mm_mask3_fmsub_pbh(__A, __B, __C, __U);
}
-__m128bh test_mm_maskz_fmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_maskz_fmsubne_pbh
+__m128bh test_mm_maskz_fmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_maskz_fmsub_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_fmsubne_pbh(__U, __A, __B, __C);
+ return _mm_maskz_fmsub_pbh(__U, __A, __B, __C);
}
-__m128bh test_mm_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_fnmaddne_pbh
+__m128bh test_mm_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_fnmadd_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
- return _mm_fnmaddne_pbh(__A, __B, __C);
+ return _mm_fnmadd_pbh(__A, __B, __C);
}
-__m128bh test_mm_mask_fnmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_mask_fnmaddne_pbh
+__m128bh test_mm_mask_fnmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_mask_fnmadd_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask_fnmaddne_pbh(__A, __U, __B, __C);
+ return _mm_mask_fnmadd_pbh(__A, __U, __B, __C);
}
-__m128bh test_mm_mask3_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
- // CHECK-LABEL: @test_mm_mask3_fnmaddne_pbh
+__m128bh test_mm_mask3_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+ // CHECK-LABEL: @test_mm_mask3_fnmadd_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask3_fnmaddne_pbh(__A, __B, __C, __U);
+ return _mm_mask3_fnmadd_pbh(__A, __B, __C, __U);
}
-__m128bh test_mm_maskz_fnmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_maskz_fnmaddne_pbh
+__m128bh test_mm_maskz_fnmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_maskz_fnmadd_pbh
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_fnmaddne_pbh(__U, __A, __B, __C);
+ return _mm_maskz_fnmadd_pbh(__U, __A, __B, __C);
}
-__m128bh test_mm_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_fnmsubne_pbh
+__m128bh test_mm_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
- return _mm_fnmsubne_pbh(__A, __B, __C);
+ return _mm_fnmsub_pbh(__A, __B, __C);
}
-__m128bh test_mm_mask_fnmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_mask_fnmsubne_pbh
+__m128bh test_mm_mask_fnmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_mask_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask_fnmsubne_pbh(__A, __U, __B, __C);
+ return _mm_mask_fnmsub_pbh(__A, __U, __B, __C);
}
-__m128bh test_mm_mask3_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
- // CHECK-LABEL: @test_mm_mask3_fnmsubne_pbh
+__m128bh test_mm_mask3_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) {
+ // CHECK-LABEL: @test_mm_mask3_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_mask3_fnmsubne_pbh(__A, __B, __C, __U);
+ return _mm_mask3_fnmsub_pbh(__A, __B, __C, __U);
}
-__m128bh test_mm_maskz_fnmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
- // CHECK-LABEL: @test_mm_maskz_fnmsubne_pbh
+__m128bh test_mm_maskz_fnmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) {
+ // CHECK-LABEL: @test_mm_maskz_fnmsub_pbh
// CHECK: fneg
// CHECK: fneg
// CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}})
// CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}
- return _mm_maskz_fnmsubne_pbh(__U, __A, __B, __C);
+ return _mm_maskz_fnmsub_pbh(__U, __A, __B, __C);
}
diff --git a/llvm/include/llvm/IR/IntrinsicsX86.td b/llvm/include/llvm/IR/IntrinsicsX86.td
index 42b211e0e1f75a..a258da8b7e49fb 100644
--- a/llvm/include/llvm/IR/IntrinsicsX86.td
+++ b/llvm/include/llvm/IR/IntrinsicsX86.td
@@ -7588,58 +7588,58 @@ def int_x86_avx10_mask_vcvtneph2hf8s512 : ClangBuiltin<"__builtin_ia32_vcvtneph2
//===----------------------------------------------------------------------===//
let TargetPrefix = "x86" in {
-def int_x86_avx10_vaddnepbf16512 : ClangBuiltin<"__builtin_ia32_vaddnepbf16512">,
+def int_x86_avx10_vaddbf16512 : ClangBuiltin<"__builtin_ia32_vaddbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vaddnepbf16256 : ClangBuiltin<"__builtin_ia32_vaddnepbf16256">,
+def int_x86_avx10_vaddbf16256 : ClangBuiltin<"__builtin_ia32_vaddbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vaddnepbf16128 : ClangBuiltin<"__builtin_ia32_vaddnepbf16128">,
+def int_x86_avx10_vaddbf16128 : ClangBuiltin<"__builtin_ia32_vaddbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vsubnepbf16512 : ClangBuiltin<"__builtin_ia32_vsubnepbf16512">,
+def int_x86_avx10_vsubbf16512 : ClangBuiltin<"__builtin_ia32_vsubbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vsubnepbf16256 : ClangBuiltin<"__builtin_ia32_vsubnepbf16256">,
+def int_x86_avx10_vsubbf16256 : ClangBuiltin<"__builtin_ia32_vsubbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vsubnepbf16128 : ClangBuiltin<"__builtin_ia32_vsubnepbf16128">,
+def int_x86_avx10_vsubbf16128 : ClangBuiltin<"__builtin_ia32_vsubbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmulnepbf16512 : ClangBuiltin<"__builtin_ia32_vmulnepbf16512">,
+def int_x86_avx10_vmulbf16512 : ClangBuiltin<"__builtin_ia32_vmulbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmulnepbf16256 : ClangBuiltin<"__builtin_ia32_vmulnepbf16256">,
+def int_x86_avx10_vmulbf16256 : ClangBuiltin<"__builtin_ia32_vmulbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmulnepbf16128 : ClangBuiltin<"__builtin_ia32_vmulnepbf16128">,
+def int_x86_avx10_vmulbf16128 : ClangBuiltin<"__builtin_ia32_vmulbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vdivnepbf16512 : ClangBuiltin<"__builtin_ia32_vdivnepbf16512">,
+def int_x86_avx10_vdivbf16512 : ClangBuiltin<"__builtin_ia32_vdivbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vdivnepbf16256 : ClangBuiltin<"__builtin_ia32_vdivnepbf16256">,
+def int_x86_avx10_vdivbf16256 : ClangBuiltin<"__builtin_ia32_vdivbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vdivnepbf16128 : ClangBuiltin<"__builtin_ia32_vdivnepbf16128">,
+def int_x86_avx10_vdivbf16128 : ClangBuiltin<"__builtin_ia32_vdivbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmaxpbf16512 : ClangBuiltin<"__builtin_ia32_vmaxpbf16512">,
+def int_x86_avx10_vmaxbf16512 : ClangBuiltin<"__builtin_ia32_vmaxbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmaxpbf16256 : ClangBuiltin<"__builtin_ia32_vmaxpbf16256">,
+def int_x86_avx10_vmaxbf16256 : ClangBuiltin<"__builtin_ia32_vmaxbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vmaxpbf16128 : ClangBuiltin<"__builtin_ia32_vmaxpbf16128">,
+def int_x86_avx10_vmaxbf16128 : ClangBuiltin<"__builtin_ia32_vmaxbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vminpbf16512 : ClangBuiltin<"__builtin_ia32_vminpbf16512">,
+def int_x86_avx10_vminbf16512 : ClangBuiltin<"__builtin_ia32_vminbf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vminpbf16256 : ClangBuiltin<"__builtin_ia32_vminpbf16256">,
+def int_x86_avx10_vminbf16256 : ClangBuiltin<"__builtin_ia32_vminbf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vminpbf16128 : ClangBuiltin<"__builtin_ia32_vminpbf16128">,
+def int_x86_avx10_vminbf16128 : ClangBuiltin<"__builtin_ia32_vminbf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
def int_x86_avx10_vcomsbf16eq : ClangBuiltin<"__builtin_ia32_vcomsbf16eq">,
@@ -7660,181 +7660,181 @@ def int_x86_avx10_vcomsbf16ge : ClangBuiltin<"__builtin_ia32_vcomsbf16ge">,
def int_x86_avx10_vcomsbf16neq : ClangBuiltin<"__builtin_ia32_vcomsbf16neq">,
DefaultAttrsIntrinsic<[llvm_i32_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rsqrt_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16128_mask">,
+def int_x86_avx10_mask_rsqrt_bf16_128 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rsqrt_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16256_mask">,
+def int_x86_avx10_mask_rsqrt_bf16_256 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rsqrt_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16512_mask">,
+def int_x86_avx10_mask_rsqrt_bf16_512 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rcp_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrcppbf16128_mask">,
+def int_x86_avx10_mask_rcp_bf16_128 : ClangBuiltin<"__builtin_ia32_vrcpbf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rcp_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrcppbf16256_mask">,
+def int_x86_avx10_mask_rcp_bf16_256 : ClangBuiltin<"__builtin_ia32_vrcpbf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_rcp_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrcppbf16512_mask">,
+def int_x86_avx10_mask_rcp_bf16_512 : ClangBuiltin<"__builtin_ia32_vrcpbf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_reduce_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vreducenepbf16128_mask">,
+def int_x86_avx10_mask_reduce_bf16_128 : ClangBuiltin<"__builtin_ia32_vreducebf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_reduce_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vreducenepbf16256_mask">,
+def int_x86_avx10_mask_reduce_bf16_256 : ClangBuiltin<"__builtin_ia32_vreducebf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_reduce_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vreducenepbf16512_mask">,
+def int_x86_avx10_mask_reduce_bf16_512 : ClangBuiltin<"__builtin_ia32_vreducebf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_fpclass_nepbf16_128 :
+def int_x86_avx10_fpclass_bf16_128 :
DefaultAttrsIntrinsic<[llvm_v8i1_ty], [llvm_v8bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_fpclass_nepbf16_256 :
+def int_x86_avx10_fpclass_bf16_256 :
DefaultAttrsIntrinsic<[llvm_v16i1_ty], [llvm_v16bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_fpclass_nepbf16_512 :
+def int_x86_avx10_fpclass_bf16_512 :
DefaultAttrsIntrinsic<[llvm_v32i1_ty], [llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_getexp_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vgetexppbf16128_mask">,
+def int_x86_avx10_mask_getexp_bf16_128 : ClangBuiltin<"__builtin_ia32_vgetexpbf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_getexp_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vgetexppbf16256_mask">,
+def int_x86_avx10_mask_getexp_bf16_256 : ClangBuiltin<"__builtin_ia32_vgetexpbf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_getexp_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vgetexppbf16512_mask">,
+def int_x86_avx10_mask_getexp_bf16_512 : ClangBuiltin<"__builtin_ia32_vgetexpbf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_getmant_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16128_mask">,
+def int_x86_avx10_mask_getmant_bf16_128 : ClangBuiltin<"__builtin_ia32_vgetmantbf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_getmant_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16256_mask">,
+def int_x86_avx10_mask_getmant_bf16_256 : ClangBuiltin<"__builtin_ia32_vgetmantbf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_getmant_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16512_mask">,
+def int_x86_avx10_mask_getmant_bf16_512 : ClangBuiltin<"__builtin_ia32_vgetmantbf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_rndscale_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_128_mask">,
+def int_x86_avx10_mask_rndscale_bf16_128 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_rndscale_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_256_mask">,
+def int_x86_avx10_mask_rndscale_bf16_256 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_rndscale_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_mask">,
+def int_x86_avx10_mask_rndscale_bf16_512 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem, ImmArg<ArgIndex<1>>]>;
-def int_x86_avx10_mask_scalef_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vscalefpbf16128_mask">,
+def int_x86_avx10_mask_scalef_bf16_128 : ClangBuiltin<"__builtin_ia32_vscalefbf16128_mask">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_scalef_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vscalefpbf16256_mask">,
+def int_x86_avx10_mask_scalef_bf16_256 : ClangBuiltin<"__builtin_ia32_vscalefbf16256_mask">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty],
[IntrNoMem]>;
-def int_x86_avx10_mask_scalef_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vscalefpbf16512_mask">,
+def int_x86_avx10_mask_scalef_bf16_512 : ClangBuiltin<"__builtin_ia32_vscalefbf16512_mask">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd213nepbf16256">,
+def int_x86_avx10_vfmadd213bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd213bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmadd213nepbf16128">,
+def int_x86_avx10_vfmadd213bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd213bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16512">,
+def int_x86_avx10_vfmadd132bf16512 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16256">,
+def int_x86_avx10_vfmadd132bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16128">,
+def int_x86_avx10_vfmadd132bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16512">,
+def int_x86_avx10_vfmadd231bf16512 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16256">,
+def int_x86_avx10_vfmadd231bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmadd231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16128">,
+def int_x86_avx10_vfmadd231bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16512">,
+def int_x86_avx10_vfmsub213bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16256">,
+def int_x86_avx10_vfmsub213bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16128">,
+def int_x86_avx10_vfmsub213bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16512">,
+def int_x86_avx10_vfmsub132bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16256">,
+def int_x86_avx10_vfmsub132bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16128">,
+def int_x86_avx10_vfmsub132bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16512">,
+def int_x86_avx10_vfmsub231bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16256">,
+def int_x86_avx10_vfmsub231bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfmsub231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16128">,
+def int_x86_avx10_vfmsub231bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16512">,
+def int_x86_avx10_vfnmadd213bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16256">,
+def int_x86_avx10_vfnmadd213bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16128">,
+def int_x86_avx10_vfnmadd213bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16512">,
+def int_x86_avx10_vfnmadd132bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16256">,
+def int_x86_avx10_vfnmadd132bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16128">,
+def int_x86_avx10_vfnmadd132bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16512">,
+def int_x86_avx10_vfnmadd231bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16256">,
+def int_x86_avx10_vfnmadd231bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmadd231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16128">,
+def int_x86_avx10_vfnmadd231bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16512">,
+def int_x86_avx10_vfnmsub213bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16256">,
+def int_x86_avx10_vfnmsub213bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16128">,
+def int_x86_avx10_vfnmsub213bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16512">,
+def int_x86_avx10_vfnmsub132bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16256">,
+def int_x86_avx10_vfnmsub132bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16128">,
+def int_x86_avx10_vfnmsub132bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16512">,
+def int_x86_avx10_vfnmsub231bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16512">,
DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16256">,
+def int_x86_avx10_vfnmsub231bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16256">,
DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty],
[IntrNoMem]>;
-def int_x86_avx10_vfnmsub231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16128">,
+def int_x86_avx10_vfnmsub231bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16128">,
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ],
[IntrNoMem]>;
}
@@ -7893,4 +7893,4 @@ def int_x86_movrsdi : ClangBuiltin<"__builtin_ia32_movrsdi">,
[IntrReadMem]>;
def int_x86_prefetchrs : ClangBuiltin<"__builtin_ia32_prefetchrs">,
Intrinsic<[], [llvm_ptr_ty], []>;
-}
\ No newline at end of file
+}
diff --git a/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp b/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp
index 41a646621c7ead..a6285a55f41554 100644
--- a/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp
+++ b/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp
@@ -3306,11 +3306,11 @@ bool X86AsmParser::parseInstruction(ParseInstructionInfo &Info, StringRef Name,
if ((PatchedName.starts_with("cmp") || PatchedName.starts_with("vcmp")) &&
(PatchedName.ends_with("ss") || PatchedName.ends_with("sd") ||
PatchedName.ends_with("sh") || PatchedName.ends_with("ph") ||
- PatchedName.ends_with("pbf16") || PatchedName.ends_with("ps") ||
+ PatchedName.ends_with("bf16") || PatchedName.ends_with("ps") ||
PatchedName.ends_with("pd"))) {
bool IsVCMP = PatchedName[0] == 'v';
unsigned CCIdx = IsVCMP ? 4 : 3;
- unsigned suffixLength = PatchedName.ends_with("pbf16") ? 5 : 2;
+ unsigned suffixLength = PatchedName.ends_with("bf16") ? 4 : 2;
unsigned CC = StringSwitch<unsigned>(
PatchedName.slice(CCIdx, PatchedName.size() - suffixLength))
.Case("eq", 0x00)
@@ -3375,8 +3375,8 @@ bool X86AsmParser::parseInstruction(ParseInstructionInfo &Info, StringRef Name,
PatchedName = "vcmpsh";
else if (PatchedName.ends_with("ph"))
PatchedName = "vcmpph";
- else if (PatchedName.ends_with("pbf16"))
- PatchedName = "vcmppbf16";
+ else if (PatchedName.ends_with("bf16"))
+ PatchedName = "vcmpbf16";
else
llvm_unreachable("Unexpected suffix!");
diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp
index abe0cc6365dd4e..cd89b88f461948 100644
--- a/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp
+++ b/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp
@@ -166,15 +166,15 @@ bool X86ATTInstPrinter::printVecCompareInstr(const MCInst *MI,
case X86::VCMPPHZrmbi: case X86::VCMPPHZrmbik:
case X86::VCMPPHZrrib: case X86::VCMPPHZrribk:
case X86::VCMPSHZrrib_Int: case X86::VCMPSHZrribk_Int:
- case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri:
- case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri:
- case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri:
- case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik:
- case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik:
- case X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik:
- case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik:
- case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik:
- case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik:
+ case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri:
+ case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri:
+ case X86::VCMPBF16Zrmi: case X86::VCMPBF16Zrri:
+ case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik:
+ case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik:
+ case X86::VCMPBF16Zrmik: case X86::VCMPBF16Zrrik:
+ case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik:
+ case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik:
+ case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik:
if (Imm >= 0 && Imm <= 31) {
OS << '\t';
printCMPMnemonic(MI, /*IsVCMP*/true, OS);
diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp
index 681d0dab37d09e..4c26fc86f95471 100644
--- a/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp
+++ b/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp
@@ -979,7 +979,7 @@ static bool printFPCLASSComments(const MCInst *MI, raw_ostream &OS,
unsigned NumOperands = MI->getNumOperands();
int SrcIdx;
switch (MI->getOpcode()) {
- CASE_FPCLASS_PACKED(FPCLASSPBF16, r)
+ CASE_FPCLASS_PACKED(FPCLASSBF16, r)
CASE_FPCLASS_PACKED(FPCLASSPH, r)
CASE_FPCLASS_PACKED(FPCLASSPS, r)
CASE_FPCLASS_PACKED(FPCLASSPD, r)
@@ -989,7 +989,7 @@ static bool printFPCLASSComments(const MCInst *MI, raw_ostream &OS,
SrcIdx = NumOperands - 2;
break;
}
- CASE_FPCLASS_PACKED_MEM(FPCLASSPBF16)
+ CASE_FPCLASS_PACKED_MEM(FPCLASSBF16)
CASE_FPCLASS_PACKED_MEM(FPCLASSPH)
CASE_FPCLASS_PACKED_MEM(FPCLASSPS)
CASE_FPCLASS_PACKED_MEM(FPCLASSPD)
diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp
index 01e2d4ace97733..8470d26011cd8e 100644
--- a/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp
+++ b/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp
@@ -309,16 +309,16 @@ void X86InstPrinterCommon::printCMPMnemonic(const MCInst *MI, bool IsVCmp,
case X86::VCMPSHZrmik_Int: case X86::VCMPSHZrrik_Int:
OS << "sh\t";
break;
- case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri:
- case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri:
- case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri:
- case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik:
- case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik:
- case X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik:
- case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik:
- case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik:
- case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik:
- OS << "pbf16\t";
+ case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri:
+ case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri:
+ case X86::VCMPBF16Zrmi: case X86::VCMPBF16Zrri:
+ case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik:
+ case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik:
+ case X86::VCMPBF16Zrmik: case X86::VCMPBF16Zrrik:
+ case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik:
+ case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik:
+ case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik:
+ OS << "bf16\t";
break;
}
}
diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp
index c26dc2ca5a7a4a..0d92609b3a63d4 100644
--- a/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp
+++ b/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp
@@ -145,15 +145,15 @@ bool X86IntelInstPrinter::printVecCompareInstr(const MCInst *MI, raw_ostream &OS
case X86::VCMPPHZrmbi: case X86::VCMPPHZrmbik:
case X86::VCMPPHZrrib: case X86::VCMPPHZrribk:
case X86::VCMPSHZrrib_Int: case X86::VCMPSHZrribk_Int:
- case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri:
- case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri:
- case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri:
- case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik:
- case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik:
- case X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik:
- case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik:
- case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik:
- case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik:
+ case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri:
+ case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri:
+ case X86::VCMPBF16Zrmi: case X86::VCMPBF16Zrri:
+ case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik:
+ case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik:
+ case X86::VCMPBF16Zrmik: case X86::VCMPBF16Zrrik:
+ case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik:
+ case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik:
+ case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik:
if (Imm >= 0 && Imm <= 31) {
OS << '\t';
printCMPMnemonic(MI, /*IsVCMP*/true, OS);
diff --git a/llvm/lib/Target/X86/X86InstrAVX10.td b/llvm/lib/Target/X86/X86InstrAVX10.td
index edbcb17297603b..6cc814f6b31f43 100644
--- a/llvm/lib/Target/X86/X86InstrAVX10.td
+++ b/llvm/lib/Target/X86/X86InstrAVX10.td
@@ -1308,31 +1308,31 @@ defm VCVTHF82PH : avx10_convert_2op_nomb<"vcvthf82ph", avx512vl_f16_info,
// AVX10 BF16 instructions
//-------------------------------------------------
-// VADDNEPBF16, VSUBNEPBF16, VMULNEPBF16, VDIVNEPBF16, VMAXPBF16, VMINPBF16
-multiclass avx10_fp_binopne_int_pbf16<bits<8> opc, string OpcodeStr,
+// VADDBF16, VSUBBF16, VMULBF16, VDIVBF16, VMAXBF16, VMINBF16
+multiclass avx10_fp_binopne_int_bf16<bits<8> opc, string OpcodeStr,
X86SchedWriteSizes sched,
bit IsCommutable = 0> {
let Predicates = [HasAVX10_2_512] in
defm Z : avx512_fp_packed<opc, OpcodeStr,
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16512"),
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16512"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16512"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16512"),
v32bf16_info, sched.PH.ZMM, IsCommutable>, EVEX_V512,
T_MAP5, PD, EVEX_CD8<16, CD8VF>;
let Predicates = [HasAVX10_2] in {
defm Z128 : avx512_fp_packed<opc, OpcodeStr,
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16128"),
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16128"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16128"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16128"),
v8bf16x_info, sched.PH.XMM, IsCommutable>, EVEX_V128,
T_MAP5, PD, EVEX_CD8<16, CD8VF>;
defm Z256 : avx512_fp_packed<opc, OpcodeStr,
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16256"),
- !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"pbf16256"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16256"),
+ !cast<Intrinsic>("int_x86_avx10_"#OpcodeStr#"bf16256"),
v16bf16x_info, sched.PH.YMM, IsCommutable>, EVEX_V256,
T_MAP5, PD, EVEX_CD8<16, CD8VF>;
}
}
-multiclass avx10_fp_binop_pbf16<bits<8> opc, string OpcodeStr, SDPatternOperator OpNode,
+multiclass avx10_fp_binop_bf16<bits<8> opc, string OpcodeStr, SDPatternOperator OpNode,
X86SchedWriteSizes sched,
bit IsCommutable = 0,
SDPatternOperator MaskOpNode = OpNode> {
@@ -1351,12 +1351,12 @@ multiclass avx10_fp_binop_pbf16<bits<8> opc, string OpcodeStr, SDPatternOperator
}
let Uses = []<Register>, mayRaiseFPException = 0 in {
-defm VADDNEPBF16 : avx10_fp_binop_pbf16<0x58, "vaddne", fadd, SchedWriteFAddSizes, 1>;
-defm VSUBNEPBF16 : avx10_fp_binop_pbf16<0x5C, "vsubne", fsub, SchedWriteFAddSizes, 0>;
-defm VMULNEPBF16 : avx10_fp_binop_pbf16<0x59, "vmulne", fmul, SchedWriteFMulSizes, 1>;
-defm VDIVNEPBF16 : avx10_fp_binop_pbf16<0x5E, "vdivne", fdiv, SchedWriteFDivSizes, 0>;
-defm VMINPBF16 : avx10_fp_binopne_int_pbf16<0x5D, "vmin", SchedWriteFCmpSizes, 0>;
-defm VMAXPBF16 : avx10_fp_binopne_int_pbf16<0x5F, "vmax", SchedWriteFCmpSizes, 0>;
+defm VADDBF16 : avx10_fp_binop_bf16<0x58, "vadd", fadd, SchedWriteFAddSizes, 1>;
+defm VSUBBF16 : avx10_fp_binop_bf16<0x5C, "vsub", fsub, SchedWriteFAddSizes, 0>;
+defm VMULBF16 : avx10_fp_binop_bf16<0x59, "vmul", fmul, SchedWriteFMulSizes, 1>;
+defm VDIVBF16 : avx10_fp_binop_bf16<0x5E, "vdiv", fdiv, SchedWriteFDivSizes, 0>;
+defm VMINBF16 : avx10_fp_binopne_int_bf16<0x5D, "vmin", SchedWriteFCmpSizes, 0>;
+defm VMAXBF16 : avx10_fp_binopne_int_bf16<0x5F, "vmax", SchedWriteFCmpSizes, 0>;
}
// VCOMSBF16
@@ -1375,7 +1375,7 @@ let Uses = []<Register>, mayRaiseFPException = 0,
}
}
-// VCMPPBF16
+// VCMPBF16
multiclass avx10_vcmp_common_bf16<X86FoldableSchedWrite sched, X86VectorVTInfo _> {
let mayRaiseFPException = 0 in {
defm rri : AVX512_maskable_cmp<0xC2, MRMSrcReg, _,
@@ -1421,56 +1421,56 @@ multiclass avx10_vcmp_bf16<X86SchedWriteWidths sched, AVX512VLVectorVTInfo _> {
}
}
-defm VCMPPBF16 : avx10_vcmp_bf16<SchedWriteFCmp, avx512vl_bf16_info>,
+defm VCMPBF16 : avx10_vcmp_bf16<SchedWriteFCmp, avx512vl_bf16_info>,
AVX512XDIi8Base, EVEX, VVVV,
EVEX_CD8<16, CD8VF>, TA;
-// VSQRTNEPBF16
+// VSQRTBF16
multiclass avx10_sqrt_packed_bf16<bits<8> opc, string OpcodeStr,
X86SchedWriteSizes sched> {
let Predicates = [HasAVX10_2_512] in
- defm Z : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "pbf16"),
+ defm Z : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "bf16"),
sched.PH.ZMM, v32bf16_info>,
EVEX_V512, PD, T_MAP5, EVEX_CD8<16, CD8VF>;
let Predicates = [HasAVX10_2] in {
- defm Z128 : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "pbf16"),
+ defm Z128 : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "bf16"),
sched.PH.XMM, v8bf16x_info>,
EVEX_V128, PD, T_MAP5, EVEX_CD8<16, CD8VF>;
- defm Z256 : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "pbf16"),
+ defm Z256 : avx512_sqrt_packed<opc, !strconcat(OpcodeStr, "bf16"),
sched.PH.YMM, v16bf16x_info>,
EVEX_V256, PD, T_MAP5, EVEX_CD8<16, CD8VF>;
}
}
let Uses = []<Register>, mayRaiseFPException = 0 in
-defm VSQRTNEPBF16 : avx10_sqrt_packed_bf16<0x51, "vsqrtne", SchedWriteFSqrtSizes>;
+defm VSQRTBF16 : avx10_sqrt_packed_bf16<0x51, "vsqrt", SchedWriteFSqrtSizes>;
-// VRSQRTPBF16, VRCPPBF16, VSRQTPBF16, VGETEXPPBF16
-multiclass avx10_fp14_pbf16<bits<8> opc, string OpcodeStr, SDNode OpNode,
+// VRSQRTBF16, VRCPBF16, VSQRTBF16, VGETEXPBF16
+multiclass avx10_fp14_bf16<bits<8> opc, string OpcodeStr, SDNode OpNode,
X86SchedWriteWidths sched> {
let Predicates = [HasAVX10_2_512] in
- defm PBF16Z : avx512_fp14_p<opc, !strconcat(OpcodeStr, "pbf16"),
- OpNode, sched.ZMM, v32bf16_info>,
- EVEX_V512;
+ defm BF16Z : avx512_fp14_p<opc, !strconcat(OpcodeStr, "bf16"),
+ OpNode, sched.ZMM, v32bf16_info>,
+ EVEX_V512;
let Predicates = [HasAVX10_2] in {
- defm PBF16Z128 : avx512_fp14_p<opc, !strconcat(OpcodeStr, "pbf16"),
- OpNode, sched.XMM, v8bf16x_info>,
- EVEX_V128;
- defm PBF16Z256 : avx512_fp14_p<opc, !strconcat(OpcodeStr, "pbf16"),
- OpNode, sched.YMM, v16bf16x_info>,
- EVEX_V256;
+ defm BF16Z128 : avx512_fp14_p<opc, !strconcat(OpcodeStr, "bf16"),
+ OpNode, sched.XMM, v8bf16x_info>,
+ EVEX_V128;
+ defm BF16Z256 : avx512_fp14_p<opc, !strconcat(OpcodeStr, "bf16"),
+ OpNode, sched.YMM, v16bf16x_info>,
+ EVEX_V256;
}
}
-defm VRSQRT : avx10_fp14_pbf16<0x4E, "vrsqrt", X86rsqrt14, SchedWriteFRsqrt>,
+defm VRSQRT : avx10_fp14_bf16<0x4E, "vrsqrt", X86rsqrt14, SchedWriteFRsqrt>,
T_MAP6, PS, EVEX_CD8<16, CD8VF>;
-defm VRCP : avx10_fp14_pbf16<0x4C, "vrcp", X86rcp14, SchedWriteFRcp>,
+defm VRCP : avx10_fp14_bf16<0x4C, "vrcp", X86rcp14, SchedWriteFRcp>,
T_MAP6, PS, EVEX_CD8<16, CD8VF>;
-defm VGETEXP : avx10_fp14_pbf16<0x42, "vgetexp", X86fgetexp, SchedWriteFRnd>,
+defm VGETEXP : avx10_fp14_bf16<0x42, "vgetexp", X86fgetexp, SchedWriteFRnd>,
T_MAP5, EVEX_CD8<16, CD8VF>;
-// VSCALEFPBF16
+// VSCALEFBF16
multiclass avx10_fp_scalef_bf16<bits<8> opc, string OpcodeStr,
X86SchedWriteWidths sched> {
let Predicates = [HasAVX10_2_512] in
@@ -1485,9 +1485,9 @@ multiclass avx10_fp_scalef_bf16<bits<8> opc, string OpcodeStr,
}
let Uses = []<Register>, mayRaiseFPException = 0 in
-defm VSCALEFPBF16 : avx10_fp_scalef_bf16<0x2C, "vscalef", SchedWriteFAdd>;
+defm VSCALEFBF16 : avx10_fp_scalef_bf16<0x2C, "vscalef", SchedWriteFAdd>;
-// VREDUCENEPBF16, VRNDSCALENEPBF16, VGETMANTPBF16
+// VREDUCEBF16, VRNDSCALEBF16, VGETMANTBF16
multiclass avx10_common_unary_fp_packed_imm_bf16<string OpcodeStr,
AVX512VLVectorVTInfo _, bits<8> opc, SDPatternOperator OpNode,
SDPatternOperator MaskOpNode, X86SchedWriteWidths sched> {
@@ -1503,18 +1503,18 @@ multiclass avx10_common_unary_fp_packed_imm_bf16<string OpcodeStr,
}
let Uses = []<Register>, mayRaiseFPException = 0 in {
-defm VREDUCENEPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vreducene", avx512vl_bf16_info, 0x56,
+defm VREDUCEBF16 : avx10_common_unary_fp_packed_imm_bf16<"vreduce", avx512vl_bf16_info, 0x56,
X86VReduce, X86VReduce, SchedWriteFRnd>,
AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>;
-defm VRNDSCALENEPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vrndscalene", avx512vl_bf16_info, 0x08,
+defm VRNDSCALEBF16 : avx10_common_unary_fp_packed_imm_bf16<"vrndscale", avx512vl_bf16_info, 0x08,
X86any_VRndScale, X86VRndScale, SchedWriteFRnd>,
AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>;
-defm VGETMANTPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vgetmant", avx512vl_bf16_info, 0x26,
+defm VGETMANTBF16 : avx10_common_unary_fp_packed_imm_bf16<"vgetmant", avx512vl_bf16_info, 0x26,
X86VGetMant, X86VGetMant, SchedWriteFRnd>,
AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>;
}
-// VFPCLASSPBF16
+// VFPCLASSBF16
multiclass avx10_fp_fpclass_bf16<string OpcodeStr, bits<8> opcVec,
X86SchedWriteWidths sched> {
let Predicates = [HasAVX10_2_512] in
@@ -1531,13 +1531,13 @@ multiclass avx10_fp_fpclass_bf16<string OpcodeStr, bits<8> opcVec,
}
}
-defm VFPCLASSPBF16 : avx10_fp_fpclass_bf16<"vfpclass", 0x66, SchedWriteFCmp>,
+defm VFPCLASSBF16 : avx10_fp_fpclass_bf16<"vfpclass", 0x66, SchedWriteFCmp>,
AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>;
-// VF[,N]M[ADD,SUB][132,213,231]NEPBF16
+// VF[,N]M[ADD,SUB][132,213,231]BF16
multiclass avx10_fma3p_213_bf16<bits<8> opc, string OpcodeStr,
- SDPatternOperator OpNode, SDNode MaskOpNode,
- X86SchedWriteWidths sched> {
+ SDPatternOperator OpNode, SDNode MaskOpNode,
+ X86SchedWriteWidths sched> {
let Predicates = [HasAVX10_2_512] in
defm Z : avx512_fma3p_213_rm<opc, OpcodeStr, OpNode, MaskOpNode,
sched.ZMM, v32bf16_info>, EVEX_V512, T_MAP6, PS,
@@ -1553,14 +1553,14 @@ multiclass avx10_fma3p_213_bf16<bits<8> opc, string OpcodeStr,
}
let Uses = []<Register>, mayRaiseFPException = 0 in {
-defm VFMADD213NEPBF16 : avx10_fma3p_213_bf16<0xA8, "vfmadd213nepbf16", any_fma,
- fma, SchedWriteFMA>;
-defm VFMSUB213NEPBF16 : avx10_fma3p_213_bf16<0xAA, "vfmsub213nepbf16", X86any_Fmsub,
- X86Fmsub, SchedWriteFMA>;
-defm VFNMADD213NEPBF16 : avx10_fma3p_213_bf16<0xAC, "vfnmadd213nepbf16", X86any_Fnmadd,
- X86Fnmadd, SchedWriteFMA>;
-defm VFNMSUB213NEPBF16 : avx10_fma3p_213_bf16<0xAE, "vfnmsub213nepbf16", X86any_Fnmsub,
- X86Fnmsub, SchedWriteFMA>;
+defm VFMADD213BF16 : avx10_fma3p_213_bf16<0xA8, "vfmadd213bf16", any_fma,
+ fma, SchedWriteFMA>;
+defm VFMSUB213BF16 : avx10_fma3p_213_bf16<0xAA, "vfmsub213bf16", X86any_Fmsub,
+ X86Fmsub, SchedWriteFMA>;
+defm VFNMADD213BF16 : avx10_fma3p_213_bf16<0xAC, "vfnmadd213bf16", X86any_Fnmadd,
+ X86Fnmadd, SchedWriteFMA>;
+defm VFNMSUB213BF16 : avx10_fma3p_213_bf16<0xAE, "vfnmsub213bf16", X86any_Fnmsub,
+ X86Fnmsub, SchedWriteFMA>;
}
multiclass avx10_fma3p_231_bf16<bits<8> opc, string OpcodeStr,
@@ -1581,14 +1581,14 @@ multiclass avx10_fma3p_231_bf16<bits<8> opc, string OpcodeStr,
}
let Uses = []<Register>, mayRaiseFPException = 0 in {
-defm VFMADD231NEPBF16 : avx10_fma3p_231_bf16<0xB8, "vfmadd231nepbf16", any_fma,
- fma, SchedWriteFMA>;
-defm VFMSUB231NEPBF16 : avx10_fma3p_231_bf16<0xBA, "vfmsub231nepbf16", X86any_Fmsub,
- X86Fmsub, SchedWriteFMA>;
-defm VFNMADD231NEPBF16 : avx10_fma3p_231_bf16<0xBC, "vfnmadd231nepbf16", X86any_Fnmadd,
- X86Fnmadd, SchedWriteFMA>;
-defm VFNMSUB231NEPBF16 : avx10_fma3p_231_bf16<0xBE, "vfnmsub231nepbf16", X86any_Fnmsub,
- X86Fnmsub, SchedWriteFMA>;
+defm VFMADD231BF16 : avx10_fma3p_231_bf16<0xB8, "vfmadd231bf16", any_fma,
+ fma, SchedWriteFMA>;
+defm VFMSUB231BF16 : avx10_fma3p_231_bf16<0xBA, "vfmsub231bf16", X86any_Fmsub,
+ X86Fmsub, SchedWriteFMA>;
+defm VFNMADD231BF16 : avx10_fma3p_231_bf16<0xBC, "vfnmadd231bf16", X86any_Fnmadd,
+ X86Fnmadd, SchedWriteFMA>;
+defm VFNMSUB231BF16 : avx10_fma3p_231_bf16<0xBE, "vfnmsub231bf16", X86any_Fnmsub,
+ X86Fnmsub, SchedWriteFMA>;
}
multiclass avx10_fma3p_132_bf16<bits<8> opc, string OpcodeStr,
@@ -1609,14 +1609,14 @@ multiclass avx10_fma3p_132_bf16<bits<8> opc, string OpcodeStr,
}
let Uses = []<Register>, mayRaiseFPException = 0 in {
-defm VFMADD132NEPBF16 : avx10_fma3p_132_bf16<0x98, "vfmadd132nepbf16", any_fma,
- fma, SchedWriteFMA>;
-defm VFMSUB132NEPBF16 : avx10_fma3p_132_bf16<0x9A, "vfmsub132nepbf16", X86any_Fmsub,
+defm VFMADD132BF16 : avx10_fma3p_132_bf16<0x98, "vfmadd132bf16", any_fma,
+ fma, SchedWriteFMA>;
+defm VFMSUB132BF16 : avx10_fma3p_132_bf16<0x9A, "vfmsub132bf16", X86any_Fmsub,
X86Fmsub, SchedWriteFMA>;
-defm VFNMADD132NEPBF16 : avx10_fma3p_132_bf16<0x9C, "vfnmadd132nepbf16", X86any_Fnmadd,
- X86Fnmadd, SchedWriteFMA>;
-defm VFNMSUB132NEPBF16 : avx10_fma3p_132_bf16<0x9E, "vfnmsub132nepbf16", X86any_Fnmsub,
- X86Fnmsub, SchedWriteFMA>;
+defm VFNMADD132BF16 : avx10_fma3p_132_bf16<0x9C, "vfnmadd132bf16", X86any_Fnmadd,
+ X86Fnmadd, SchedWriteFMA>;
+defm VFNMSUB132BF16 : avx10_fma3p_132_bf16<0x9E, "vfnmsub132bf16", X86any_Fnmsub,
+ X86Fnmsub, SchedWriteFMA>;
}
//-------------------------------------------------
diff --git a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp
index 0da4857d66748c..d0c508d9934c35 100644
--- a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp
+++ b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp
@@ -53,7 +53,7 @@ using namespace llvm;
FMA3GROUP_PACKED_WIDTHS_ALL(Name, PS, Attrs)
#define FMA3GROUP_PACKED_BF16(Name, Attrs) \
- FMA3GROUP_PACKED_WIDTHS_Z(Name, NEPBF16, Attrs)
+ FMA3GROUP_PACKED_WIDTHS_Z(Name, BF16, Attrs)
#define FMA3GROUP_SCALAR_WIDTHS_Z(Name, Suf, Attrs) \
FMA3GROUP(Name, Suf##Zm, Attrs) \
@@ -93,7 +93,7 @@ static const X86InstrFMA3Group Groups[] = {
FMA3GROUP_MASKED(Name, Type##Z##Suf, Attrs)
#define FMA3GROUP_PACKED_AVX512_ALL(Name, Suf, Attrs) \
- FMA3GROUP_PACKED_AVX512_WIDTHS(Name, NEPBF16, Suf, Attrs) \
+ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, BF16, Suf, Attrs) \
FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PD, Suf, Attrs) \
FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PH, Suf, Attrs) \
FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PS, Suf, Attrs)
diff --git a/llvm/lib/Target/X86/X86InstrUtils.td b/llvm/lib/Target/X86/X86InstrUtils.td
index ab171ac79fb377..6aae90b77fbadd 100644
--- a/llvm/lib/Target/X86/X86InstrUtils.td
+++ b/llvm/lib/Target/X86/X86InstrUtils.td
@@ -311,7 +311,7 @@ def v32i16_info : X86VectorVTInfo<32, i16, VR512, "w">;
def v16i32_info : X86VectorVTInfo<16, i32, VR512, "d">;
def v8i64_info : X86VectorVTInfo<8, i64, VR512, "q">;
def v32f16_info : X86VectorVTInfo<32, f16, VR512, "ph">;
-def v32bf16_info: X86VectorVTInfo<32, bf16, VR512, "pbf16">;
+def v32bf16_info: X86VectorVTInfo<32, bf16, VR512, "bf16">;
def v16f32_info : X86VectorVTInfo<16, f32, VR512, "ps">;
def v8f64_info : X86VectorVTInfo<8, f64, VR512, "pd">;
@@ -321,7 +321,7 @@ def v16i16x_info : X86VectorVTInfo<16, i16, VR256X, "w">;
def v8i32x_info : X86VectorVTInfo<8, i32, VR256X, "d">;
def v4i64x_info : X86VectorVTInfo<4, i64, VR256X, "q">;
def v16f16x_info : X86VectorVTInfo<16, f16, VR256X, "ph">;
-def v16bf16x_info: X86VectorVTInfo<16, bf16, VR256X, "pbf16">;
+def v16bf16x_info: X86VectorVTInfo<16, bf16, VR256X, "bf16">;
def v8f32x_info : X86VectorVTInfo<8, f32, VR256X, "ps">;
def v4f64x_info : X86VectorVTInfo<4, f64, VR256X, "pd">;
@@ -330,7 +330,7 @@ def v8i16x_info : X86VectorVTInfo<8, i16, VR128X, "w">;
def v4i32x_info : X86VectorVTInfo<4, i32, VR128X, "d">;
def v2i64x_info : X86VectorVTInfo<2, i64, VR128X, "q">;
def v8f16x_info : X86VectorVTInfo<8, f16, VR128X, "ph">;
-def v8bf16x_info : X86VectorVTInfo<8, bf16, VR128X, "pbf16">;
+def v8bf16x_info : X86VectorVTInfo<8, bf16, VR128X, "bf16">;
def v4f32x_info : X86VectorVTInfo<4, f32, VR128X, "ps">;
def v2f64x_info : X86VectorVTInfo<2, f64, VR128X, "pd">;
diff --git a/llvm/lib/Target/X86/X86IntrinsicsInfo.h b/llvm/lib/Target/X86/X86IntrinsicsInfo.h
index 86fd04046d16a0..91d7d8755be9b9 100644
--- a/llvm/lib/Target/X86/X86IntrinsicsInfo.h
+++ b/llvm/lib/Target/X86/X86IntrinsicsInfo.h
@@ -389,53 +389,53 @@ static const IntrinsicData IntrinsicsWithoutChain[] = {
X86_INTRINSIC_DATA(avx_vpermilvar_ps, INTR_TYPE_2OP, X86ISD::VPERMILPV, 0),
X86_INTRINSIC_DATA(avx_vpermilvar_ps_256, INTR_TYPE_2OP, X86ISD::VPERMILPV,
0),
- X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_128, INTR_TYPE_2OP,
- X86ISD::VFPCLASS, 0),
- X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_256, INTR_TYPE_2OP,
- X86ISD::VFPCLASS, 0),
- X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_512, INTR_TYPE_2OP,
- X86ISD::VFPCLASS, 0),
- X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_128, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_fpclass_bf16_128, INTR_TYPE_2OP, X86ISD::VFPCLASS,
+ 0),
+ X86_INTRINSIC_DATA(avx10_fpclass_bf16_256, INTR_TYPE_2OP, X86ISD::VFPCLASS,
+ 0),
+ X86_INTRINSIC_DATA(avx10_fpclass_bf16_512, INTR_TYPE_2OP, X86ISD::VFPCLASS,
+ 0),
+ X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_128, INTR_TYPE_1OP_MASK,
X86ISD::FGETEXP, 0),
- X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_256, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_256, INTR_TYPE_1OP_MASK,
X86ISD::FGETEXP, 0),
- X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_512, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_512, INTR_TYPE_1OP_MASK,
X86ISD::FGETEXP, 0),
- X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_128, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_128, INTR_TYPE_2OP_MASK,
X86ISD::VGETMANT, 0),
- X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_256, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_256, INTR_TYPE_2OP_MASK,
X86ISD::VGETMANT, 0),
- X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_512, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_512, INTR_TYPE_2OP_MASK,
X86ISD::VGETMANT, 0),
- X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_128, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_128, INTR_TYPE_1OP_MASK,
X86ISD::RCP14, 0),
- X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_256, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_256, INTR_TYPE_1OP_MASK,
X86ISD::RCP14, 0),
- X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_512, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_512, INTR_TYPE_1OP_MASK,
X86ISD::RCP14, 0),
- X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_128, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_128, INTR_TYPE_2OP_MASK,
X86ISD::VREDUCE, 0),
- X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_256, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_256, INTR_TYPE_2OP_MASK,
X86ISD::VREDUCE, 0),
- X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_512, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_512, INTR_TYPE_2OP_MASK,
X86ISD::VREDUCE, 0),
- X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_128, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_128, INTR_TYPE_2OP_MASK,
X86ISD::VRNDSCALE, 0),
- X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_256, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_256, INTR_TYPE_2OP_MASK,
X86ISD::VRNDSCALE, 0),
- X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_512, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_512, INTR_TYPE_2OP_MASK,
X86ISD::VRNDSCALE, 0),
- X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_128, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_128, INTR_TYPE_1OP_MASK,
X86ISD::RSQRT14, 0),
- X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_256, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_256, INTR_TYPE_1OP_MASK,
X86ISD::RSQRT14, 0),
- X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_512, INTR_TYPE_1OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_512, INTR_TYPE_1OP_MASK,
X86ISD::RSQRT14, 0),
- X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_128, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_128, INTR_TYPE_2OP_MASK,
X86ISD::SCALEF, 0),
- X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_256, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_256, INTR_TYPE_2OP_MASK,
X86ISD::SCALEF, 0),
- X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_512, INTR_TYPE_2OP_MASK,
+ X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_512, INTR_TYPE_2OP_MASK,
X86ISD::SCALEF, 0),
X86_INTRINSIC_DATA(avx10_mask_vcmppd256, CMP_MASK_CC, X86ISD::CMPMM,
X86ISD::CMPMM_SAE),
diff --git a/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll b/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll
index c41e03ba637cbe..ab8ac4fbd41932 100644
--- a/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll
+++ b/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll
@@ -4,7 +4,7 @@
define <8 x bfloat> @fma_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_123_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
ret <8 x bfloat> %a
@@ -13,7 +13,7 @@ define <8 x bfloat> @fma_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_213_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
ret <8 x bfloat> %a
@@ -22,7 +22,7 @@ define <8 x bfloat> @fma_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_231_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0
+; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
ret <8 x bfloat> %a
@@ -31,7 +31,7 @@ define <8 x bfloat> @fma_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_321_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0
+; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
ret <8 x bfloat> %a
@@ -40,7 +40,7 @@ define <8 x bfloat> @fma_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_132_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0
+; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
ret <8 x bfloat> %a
@@ -49,7 +49,7 @@ define <8 x bfloat> @fma_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) {
; CHECK-LABEL: fma_312_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0
+; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
ret <8 x bfloat> %a
@@ -58,7 +58,7 @@ define <8 x bfloat> @fma_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa
define <8 x bfloat> @fma_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_123_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
@@ -68,7 +68,7 @@ define <8 x bfloat> @fma_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %
define <8 x bfloat> @fma_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_213_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
@@ -78,7 +78,7 @@ define <8 x bfloat> @fma_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %
define <8 x bfloat> @fma_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_231_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
@@ -88,7 +88,7 @@ define <8 x bfloat> @fma_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %
define <8 x bfloat> @fma_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_321_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
@@ -98,7 +98,7 @@ define <8 x bfloat> @fma_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %
define <8 x bfloat> @fma_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_132_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
@@ -108,7 +108,7 @@ define <8 x bfloat> @fma_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %
define <8 x bfloat> @fma_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_312_v8bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
@@ -119,7 +119,7 @@ define <8 x bfloat> @fma_mask_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_123_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
%b = bitcast i8 %mask to <8 x i1>
@@ -131,7 +131,7 @@ define <8 x bfloat> @fma_mask_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_213_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
%b = bitcast i8 %mask to <8 x i1>
@@ -143,7 +143,7 @@ define <8 x bfloat> @fma_mask_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_231_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %xmm2, %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %xmm2, %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
%b = bitcast i8 %mask to <8 x i1>
@@ -155,7 +155,7 @@ define <8 x bfloat> @fma_mask_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_321_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
%b = bitcast i8 %mask to <8 x i1>
@@ -167,7 +167,7 @@ define <8 x bfloat> @fma_mask_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_132_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %xmm2, %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %xmm2, %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
%b = bitcast i8 %mask to <8 x i1>
@@ -179,7 +179,7 @@ define <8 x bfloat> @fma_mask_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_mask_312_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
%b = bitcast i8 %mask to <8 x i1>
@@ -191,7 +191,7 @@ define <8 x bfloat> @fma_maskz_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_123_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
%b = bitcast i8 %mask to <8 x i1>
@@ -203,7 +203,7 @@ define <8 x bfloat> @fma_maskz_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_213_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
%b = bitcast i8 %mask to <8 x i1>
@@ -215,7 +215,7 @@ define <8 x bfloat> @fma_maskz_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_231_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
%b = bitcast i8 %mask to <8 x i1>
@@ -227,7 +227,7 @@ define <8 x bfloat> @fma_maskz_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_321_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
%b = bitcast i8 %mask to <8 x i1>
@@ -239,7 +239,7 @@ define <8 x bfloat> @fma_maskz_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_132_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
%b = bitcast i8 %mask to <8 x i1>
@@ -251,7 +251,7 @@ define <8 x bfloat> @fma_maskz_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x
; CHECK-LABEL: fma_maskz_312_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
%b = bitcast i8 %mask to <8 x i1>
@@ -263,7 +263,7 @@ define <8 x bfloat> @fma_mask_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_123_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
@@ -276,7 +276,7 @@ define <8 x bfloat> @fma_mask_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_213_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
@@ -289,7 +289,7 @@ define <8 x bfloat> @fma_mask_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_231_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
@@ -302,7 +302,7 @@ define <8 x bfloat> @fma_mask_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_321_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
@@ -315,7 +315,7 @@ define <8 x bfloat> @fma_mask_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_132_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
@@ -328,7 +328,7 @@ define <8 x bfloat> @fma_mask_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_mask_load_312_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
@@ -341,7 +341,7 @@ define <8 x bfloat> @fma_maskz_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_123_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z)
@@ -354,7 +354,7 @@ define <8 x bfloat> @fma_maskz_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_213_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z)
@@ -367,7 +367,7 @@ define <8 x bfloat> @fma_maskz_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_231_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x)
@@ -380,7 +380,7 @@ define <8 x bfloat> @fma_maskz_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_321_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x)
@@ -393,7 +393,7 @@ define <8 x bfloat> @fma_maskz_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_132_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y)
@@ -406,7 +406,7 @@ define <8 x bfloat> @fma_maskz_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
; CHECK-LABEL: fma_maskz_load_312_v8bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <8 x bfloat>, ptr %zp
%a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y)
@@ -418,7 +418,7 @@ define <8 x bfloat> @fma_maskz_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y,
define <16 x bfloat> @fma_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_123_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
ret <16 x bfloat> %a
@@ -427,7 +427,7 @@ define <16 x bfloat> @fma_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_213_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
ret <16 x bfloat> %a
@@ -436,7 +436,7 @@ define <16 x bfloat> @fma_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_231_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
ret <16 x bfloat> %a
@@ -445,7 +445,7 @@ define <16 x bfloat> @fma_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_321_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
ret <16 x bfloat> %a
@@ -454,7 +454,7 @@ define <16 x bfloat> @fma_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_132_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
ret <16 x bfloat> %a
@@ -463,7 +463,7 @@ define <16 x bfloat> @fma_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) {
; CHECK-LABEL: fma_312_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
ret <16 x bfloat> %a
@@ -472,7 +472,7 @@ define <16 x bfloat> @fma_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x
define <16 x bfloat> @fma_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_123_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
@@ -482,7 +482,7 @@ define <16 x bfloat> @fma_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p
define <16 x bfloat> @fma_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_213_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
@@ -492,7 +492,7 @@ define <16 x bfloat> @fma_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p
define <16 x bfloat> @fma_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_231_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
@@ -502,7 +502,7 @@ define <16 x bfloat> @fma_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p
define <16 x bfloat> @fma_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_321_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
@@ -512,7 +512,7 @@ define <16 x bfloat> @fma_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p
define <16 x bfloat> @fma_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_132_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
@@ -522,7 +522,7 @@ define <16 x bfloat> @fma_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p
define <16 x bfloat> @fma_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_312_v16bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
@@ -533,7 +533,7 @@ define <16 x bfloat> @fma_mask_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_123_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
%b = bitcast i16 %mask to <16 x i1>
@@ -545,7 +545,7 @@ define <16 x bfloat> @fma_mask_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_213_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
%b = bitcast i16 %mask to <16 x i1>
@@ -557,7 +557,7 @@ define <16 x bfloat> @fma_mask_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_231_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %ymm2, %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %ymm2, %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
%b = bitcast i16 %mask to <16 x i1>
@@ -569,7 +569,7 @@ define <16 x bfloat> @fma_mask_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_321_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
%b = bitcast i16 %mask to <16 x i1>
@@ -581,7 +581,7 @@ define <16 x bfloat> @fma_mask_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_132_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %ymm2, %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %ymm2, %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
%b = bitcast i16 %mask to <16 x i1>
@@ -593,7 +593,7 @@ define <16 x bfloat> @fma_mask_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <
; CHECK-LABEL: fma_mask_312_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
%b = bitcast i16 %mask to <16 x i1>
@@ -605,7 +605,7 @@ define <16 x bfloat> @fma_maskz_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_123_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
%b = bitcast i16 %mask to <16 x i1>
@@ -617,7 +617,7 @@ define <16 x bfloat> @fma_maskz_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_213_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
%b = bitcast i16 %mask to <16 x i1>
@@ -629,7 +629,7 @@ define <16 x bfloat> @fma_maskz_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_231_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
%b = bitcast i16 %mask to <16 x i1>
@@ -641,7 +641,7 @@ define <16 x bfloat> @fma_maskz_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_321_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
%b = bitcast i16 %mask to <16 x i1>
@@ -653,7 +653,7 @@ define <16 x bfloat> @fma_maskz_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_132_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
%b = bitcast i16 %mask to <16 x i1>
@@ -665,7 +665,7 @@ define <16 x bfloat> @fma_maskz_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y,
; CHECK-LABEL: fma_maskz_312_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
%b = bitcast i16 %mask to <16 x i1>
@@ -677,7 +677,7 @@ define <16 x bfloat> @fma_mask_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_123_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
@@ -690,7 +690,7 @@ define <16 x bfloat> @fma_mask_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_213_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
@@ -703,7 +703,7 @@ define <16 x bfloat> @fma_mask_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_231_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
@@ -716,7 +716,7 @@ define <16 x bfloat> @fma_mask_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_321_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
@@ -729,7 +729,7 @@ define <16 x bfloat> @fma_mask_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_132_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
@@ -742,7 +742,7 @@ define <16 x bfloat> @fma_mask_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_mask_load_312_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
@@ -755,7 +755,7 @@ define <16 x bfloat> @fma_maskz_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_123_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z)
@@ -768,7 +768,7 @@ define <16 x bfloat> @fma_maskz_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_213_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z)
@@ -781,7 +781,7 @@ define <16 x bfloat> @fma_maskz_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_231_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x)
@@ -794,7 +794,7 @@ define <16 x bfloat> @fma_maskz_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_321_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x)
@@ -807,7 +807,7 @@ define <16 x bfloat> @fma_maskz_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_132_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y)
@@ -820,7 +820,7 @@ define <16 x bfloat> @fma_maskz_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat>
; CHECK-LABEL: fma_maskz_load_312_v16bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <16 x bfloat>, ptr %zp
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y)
@@ -832,7 +832,7 @@ define <16 x bfloat> @fma_maskz_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat>
define <32 x bfloat> @fma_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_123_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
ret <32 x bfloat> %a
@@ -841,7 +841,7 @@ define <32 x bfloat> @fma_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_213_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
ret <32 x bfloat> %a
@@ -850,7 +850,7 @@ define <32 x bfloat> @fma_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_231_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0
+; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
ret <32 x bfloat> %a
@@ -859,7 +859,7 @@ define <32 x bfloat> @fma_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_321_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0
+; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
ret <32 x bfloat> %a
@@ -868,7 +868,7 @@ define <32 x bfloat> @fma_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_132_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0
+; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
ret <32 x bfloat> %a
@@ -877,7 +877,7 @@ define <32 x bfloat> @fma_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) {
; CHECK-LABEL: fma_312_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0
+; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
ret <32 x bfloat> %a
@@ -886,7 +886,7 @@ define <32 x bfloat> @fma_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x
define <32 x bfloat> @fma_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_123_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
@@ -896,7 +896,7 @@ define <32 x bfloat> @fma_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p
define <32 x bfloat> @fma_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_213_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
@@ -906,7 +906,7 @@ define <32 x bfloat> @fma_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p
define <32 x bfloat> @fma_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_231_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
@@ -916,7 +916,7 @@ define <32 x bfloat> @fma_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p
define <32 x bfloat> @fma_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_321_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
@@ -926,7 +926,7 @@ define <32 x bfloat> @fma_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p
define <32 x bfloat> @fma_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_132_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
@@ -936,7 +936,7 @@ define <32 x bfloat> @fma_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p
define <32 x bfloat> @fma_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) {
; CHECK-LABEL: fma_load_312_v32bf16:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
@@ -947,7 +947,7 @@ define <32 x bfloat> @fma_mask_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_123_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
%b = bitcast i32 %mask to <32 x i1>
@@ -959,7 +959,7 @@ define <32 x bfloat> @fma_mask_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_213_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
%b = bitcast i32 %mask to <32 x i1>
@@ -971,7 +971,7 @@ define <32 x bfloat> @fma_mask_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_231_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %zmm2, %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %zmm2, %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
%b = bitcast i32 %mask to <32 x i1>
@@ -983,7 +983,7 @@ define <32 x bfloat> @fma_mask_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_321_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
%b = bitcast i32 %mask to <32 x i1>
@@ -995,7 +995,7 @@ define <32 x bfloat> @fma_mask_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_132_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 %zmm2, %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 %zmm2, %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
%b = bitcast i32 %mask to <32 x i1>
@@ -1007,7 +1007,7 @@ define <32 x bfloat> @fma_mask_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <
; CHECK-LABEL: fma_mask_312_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
%b = bitcast i32 %mask to <32 x i1>
@@ -1019,7 +1019,7 @@ define <32 x bfloat> @fma_maskz_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_123_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
%b = bitcast i32 %mask to <32 x i1>
@@ -1031,7 +1031,7 @@ define <32 x bfloat> @fma_maskz_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_213_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
%b = bitcast i32 %mask to <32 x i1>
@@ -1043,7 +1043,7 @@ define <32 x bfloat> @fma_maskz_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_231_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
%b = bitcast i32 %mask to <32 x i1>
@@ -1055,7 +1055,7 @@ define <32 x bfloat> @fma_maskz_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_321_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
%b = bitcast i32 %mask to <32 x i1>
@@ -1067,7 +1067,7 @@ define <32 x bfloat> @fma_maskz_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_132_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
%b = bitcast i32 %mask to <32 x i1>
@@ -1079,7 +1079,7 @@ define <32 x bfloat> @fma_maskz_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y,
; CHECK-LABEL: fma_maskz_312_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %edi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
%b = bitcast i32 %mask to <32 x i1>
@@ -1091,7 +1091,7 @@ define <32 x bfloat> @fma_mask_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_123_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
@@ -1104,7 +1104,7 @@ define <32 x bfloat> @fma_mask_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_213_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
@@ -1117,7 +1117,7 @@ define <32 x bfloat> @fma_mask_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_231_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
@@ -1130,7 +1130,7 @@ define <32 x bfloat> @fma_mask_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_321_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
@@ -1143,7 +1143,7 @@ define <32 x bfloat> @fma_mask_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_132_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
@@ -1156,7 +1156,7 @@ define <32 x bfloat> @fma_mask_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_mask_load_312_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
@@ -1169,7 +1169,7 @@ define <32 x bfloat> @fma_maskz_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_123_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z)
@@ -1182,7 +1182,7 @@ define <32 x bfloat> @fma_maskz_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_213_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z)
@@ -1195,7 +1195,7 @@ define <32 x bfloat> @fma_maskz_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_231_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x)
@@ -1208,7 +1208,7 @@ define <32 x bfloat> @fma_maskz_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_321_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x)
@@ -1221,7 +1221,7 @@ define <32 x bfloat> @fma_maskz_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_132_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y)
@@ -1234,7 +1234,7 @@ define <32 x bfloat> @fma_maskz_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat>
; CHECK-LABEL: fma_maskz_load_312_v32bf16:
; CHECK: # %bb.0:
; CHECK-NEXT: kmovd %esi, %k1
-; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
+; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1} {z}
; CHECK-NEXT: retq
%z = load <32 x bfloat>, ptr %zp
%a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y)
diff --git a/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll b/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll
index 33c40ac6bb32c7..1e2cf4956bd087 100644
--- a/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll
+++ b/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll
@@ -2,26 +2,26 @@
; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X64
; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X86
-define <32 x bfloat> @test_int_x86_avx10_vaddnepbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vaddnepbf16512:
+define <32 x bfloat> @test_int_x86_avx10_vaddbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vaddbf16512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
+; CHECK-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fadd <32 x bfloat> %x1, %x2
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_mask_add_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_add_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2]
+; X64-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_mask_add_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2]
+; X86-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%res0 = fadd <32 x bfloat> %x1, %x2
@@ -29,22 +29,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_512(<32 x bfloat> %src
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_add_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2]
-; X64-NEXT: vaddnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x0e]
-; X64-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
+; X64-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2]
+; X64-NEXT: vaddbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x0e]
+; X64-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_512:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2]
-; X86-NEXT: vaddnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x08]
-; X86-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
+; X86-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2]
+; X86-NEXT: vaddbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x08]
+; X86-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%val = load <32 x bfloat>, ptr %ptr
@@ -56,26 +56,26 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_512(<32 x bfloat> %sr
ret <32 x bfloat> %res3
}
-define <32 x bfloat> @test_int_x86_avx10_sub_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_sub_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_sub_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5c,0xc1]
+; CHECK-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5c,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fsub <32 x bfloat> %x1, %x2
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_mask_sub_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2]
+; X64-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2]
+; X86-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%res0 = fsub <32 x bfloat> %x1, %x2
@@ -83,22 +83,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_512(<32 x bfloat> %src
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2]
-; X64-NEXT: vsubnepbf16 (%rsi), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x0e]
-; X64-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1]
+; X64-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2]
+; X64-NEXT: vsubbf16 (%rsi), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x0e]
+; X64-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_512:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2]
-; X86-NEXT: vsubnepbf16 (%eax), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x08]
-; X86-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1]
+; X86-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2]
+; X86-NEXT: vsubbf16 (%eax), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x08]
+; X86-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%val = load <32 x bfloat>, ptr %ptr
@@ -110,28 +110,28 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_512(<32 x bfloat> %sr
ret <32 x bfloat> %res3
}
-declare <32 x bfloat> @llvm.x86.avx10.vmulnepbf16512(<32 x bfloat>, <32 x bfloat>)
+declare <32 x bfloat> @llvm.x86.avx10.vmulbf16512(<32 x bfloat>, <32 x bfloat>)
-define <32 x bfloat> @test_int_x86_avx10_mul_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_mul_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_mul_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_mul_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
+; CHECK-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fmul <32 x bfloat> %x1, %x2
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_mask_mul_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2]
+; X64-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2]
+; X86-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%res0 = fmul <32 x bfloat> %x1, %x2
@@ -139,22 +139,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_512(<32 x bfloat> %src
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2]
-; X64-NEXT: vmulnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x0e]
-; X64-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
+; X64-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2]
+; X64-NEXT: vmulbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x0e]
+; X64-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_512:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2]
-; X86-NEXT: vmulnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x08]
-; X86-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
+; X86-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2]
+; X86-NEXT: vmulbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x08]
+; X86-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%val = load <32 x bfloat>, ptr %ptr
@@ -166,26 +166,26 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_512(<32 x bfloat> %sr
ret <32 x bfloat> %res3
}
-define <32 x bfloat> @test_int_x86_avx10_div_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_div_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_div_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
+; CHECK-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fdiv <32 x bfloat> %x1, %x2
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_mask_div_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_div_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2]
+; X64-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_mask_div_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2]
+; X86-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%res0 = fdiv <32 x bfloat> %x1, %x2
@@ -193,22 +193,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_512(<32 x bfloat> %src
ret <32 x bfloat> %res
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_div_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2]
-; X64-NEXT: vdivnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x0e]
-; X64-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
+; X64-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2]
+; X64-NEXT: vdivbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x0e]
+; X64-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_512:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2]
-; X86-NEXT: vdivnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x08]
-; X86-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
+; X86-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2]
+; X86-NEXT: vdivbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x08]
+; X86-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
%val = load <32 x bfloat>, ptr %ptr
@@ -220,10 +220,10 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_512(<32 x bfloat> %sr
ret <32 x bfloat> %res3
}
-define i32 @test_int_x86_avx10_vcmppbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16512:
+define i32 @test_int_x86_avx10_vcmpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpunordpbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x03]
+; CHECK-NEXT: vcmpunordbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x03]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
@@ -233,10 +233,10 @@ define i32 @test_int_x86_avx10_vcmppbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2
}
; FIXME: _mm512_mask_cmp_p[s|h]_mask is not using {k2} but gcc does
-define i32 @test_int_x86_avx10_vcmppbf16512_mask2(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16512_mask2:
+define i32 @test_int_x86_avx10_vcmpbf16512_mask2(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16512_mask2:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpeqpbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x00]
+; CHECK-NEXT: vcmpeqbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x00]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: andl $3, %eax # encoding: [0x83,0xe0,0x03]
; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77]
@@ -247,10 +247,10 @@ define i32 @test_int_x86_avx10_vcmppbf16512_mask2(<32 x bfloat> %x1, <32 x bfloa
ret i32 %3
}
-define <32 x bfloat> @test_sqrt_nepbf16_512(<32 x bfloat> %a0) {
-; CHECK-LABEL: test_sqrt_nepbf16_512:
+define <32 x bfloat> @test_sqrt_bf16_512(<32 x bfloat> %a0) {
+; CHECK-LABEL: test_sqrt_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsqrtnepbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x51,0xc0]
+; CHECK-NEXT: vsqrtbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x51,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%1 = tail call <32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %a0)
ret <32 x bfloat> %1
@@ -260,13 +260,13 @@ define <32 x bfloat> @test_mm512_mask_sqrt_pbh(<32 x bfloat> %__W, i32 %__U, <32
; X64-LABEL: test_mm512_mask_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1]
+; X64-NEXT: vsqrtbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1]
+; X86-NEXT: vsqrtbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %__A)
@@ -279,13 +279,13 @@ define <32 x bfloat> @test_mm512_maskz_sqrt_pbh(i32 %__U, <32 x bfloat>%__A) {
; X64-LABEL: test_mm512_maskz_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0]
+; X64-NEXT: vsqrtbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_maskz_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0]
+; X86-NEXT: vsqrtbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %__A)
@@ -297,7 +297,7 @@ entry:
define <32 x bfloat> @test_mm512_fmaddne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) {
; CHECK-LABEL: test_mm512_fmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xa8,0xc2]
+; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xa8,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C)
@@ -308,13 +308,13 @@ define <32 x bfloat> @test_mm512_mask_fmaddne_pbh(<32 x bfloat> %__A, i32 %__U,
; X64-LABEL: test_mm512_mask_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1]
+; X64-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1]
+; X86-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C)
@@ -327,14 +327,14 @@ define <32 x bfloat> @test_mm512_mask3_fmaddne_pbh(<32 x bfloat> %__A, <32 x bfl
; X64-LABEL: test_mm512_mask3_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1]
+; X64-NEXT: vfmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1]
; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask3_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1]
+; X86-NEXT: vfmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1]
; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -348,13 +348,13 @@ define <32 x bfloat> @test_mm512_maskz_fmaddne_pbh(i32 %__U, <32 x bfloat> %__A,
; X64-LABEL: test_mm512_maskz_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2]
+; X64-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_maskz_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2]
+; X86-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C)
@@ -366,7 +366,7 @@ entry:
define <32 x bfloat> @test_mm512_fmsubne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) {
; CHECK-LABEL: test_mm512_fmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xaa,0xc2]
+; CHECK-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xaa,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <32 x bfloat> %__C
@@ -378,13 +378,13 @@ define <32 x bfloat> @test_mm512_mask_fmsubne_pbh(<32 x bfloat> %__A, i32 %__U,
; X64-LABEL: test_mm512_mask_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1]
+; X64-NEXT: vfmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1]
+; X86-NEXT: vfmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__C
@@ -398,14 +398,14 @@ define <32 x bfloat> @test_mm512_mask3_fmsubne_pbh(<32 x bfloat> %__A, <32 x bfl
; X64-LABEL: test_mm512_mask3_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1]
+; X64-NEXT: vfmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1]
; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask3_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1]
+; X86-NEXT: vfmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1]
; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -420,13 +420,13 @@ define <32 x bfloat> @test_mm512_maskz_fmsubne_pbh(i32 %__U, <32 x bfloat> %__A,
; X64-LABEL: test_mm512_maskz_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2]
+; X64-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_maskz_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2]
+; X86-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__C
@@ -439,7 +439,7 @@ entry:
define <32 x bfloat> @test_mm512_fnmaddne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) {
; CHECK-LABEL: test_mm512_fnmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xac,0xc2]
+; CHECK-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xac,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <32 x bfloat> %__B
@@ -451,13 +451,13 @@ define <32 x bfloat> @test_mm512_mask_fnmaddne_pbh(<32 x bfloat> %__A, i32 %__U,
; X64-LABEL: test_mm512_mask_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1]
+; X64-NEXT: vfnmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1]
+; X86-NEXT: vfnmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__B
@@ -471,14 +471,14 @@ define <32 x bfloat> @test_mm512_mask3_fnmaddne_pbh(<32 x bfloat> %__A, <32 x bf
; X64-LABEL: test_mm512_mask3_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1]
+; X64-NEXT: vfnmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1]
; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask3_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1]
+; X86-NEXT: vfnmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1]
; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -493,13 +493,13 @@ define <32 x bfloat> @test_mm512_maskz_fnmaddne_pbh(i32 %__U, <32 x bfloat> %__A
; X64-LABEL: test_mm512_maskz_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2]
+; X64-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_maskz_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2]
+; X86-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__B
@@ -512,7 +512,7 @@ entry:
define <32 x bfloat> @test_mm512_fnmsubne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) {
; CHECK-LABEL: test_mm512_fnmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xae,0xc2]
+; CHECK-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xae,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <32 x bfloat> %__B
@@ -525,13 +525,13 @@ define <32 x bfloat> @test_mm512_mask_fnmsubne_pbh(<32 x bfloat> %__A, i32 %__U,
; X64-LABEL: test_mm512_mask_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1]
+; X64-NEXT: vfnmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1]
+; X86-NEXT: vfnmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__B
@@ -546,14 +546,14 @@ define <32 x bfloat> @test_mm512_mask3_fnmsubne_pbh(<32 x bfloat> %__A, <32 x bf
; X64-LABEL: test_mm512_mask3_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1]
+; X64-NEXT: vfnmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1]
; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_mask3_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1]
+; X86-NEXT: vfnmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1]
; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -569,13 +569,13 @@ define <32 x bfloat> @test_mm512_maskz_fnmsubne_pbh(i32 %__U, <32 x bfloat> %__A
; X64-LABEL: test_mm512_maskz_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2]
+; X64-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm512_maskz_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2]
+; X86-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <32 x bfloat> %__B
diff --git a/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll b/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll
index 5f2bcf0556b021..da17b995afedf2 100644
--- a/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll
+++ b/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll
@@ -2,231 +2,231 @@
; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X64
; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X86
-declare <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat>, <32 x bfloat>)
+declare <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat>, <32 x bfloat>)
-define <32 x bfloat> @test_int_x86_avx10_min_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_min_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_min_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vminpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5d,0xc1]
+; CHECK-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5d,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
+ %res0 = call <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
ret <32 x bfloat> %res0
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_min_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vminpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1]
+; X64-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vminpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1]
+; X86-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
- %res0 = call <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
+ %res0 = call <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
%res1 = select <32 x i1> %mask, <32 x bfloat> %res0, <32 x bfloat> zeroinitializer
ret <32 x bfloat> %res1
}
-declare <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat>, <32 x bfloat>)
+declare <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat>, <32 x bfloat>)
-define <32 x bfloat> @test_int_x86_avx10_max_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_max_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_max_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5f,0xc1]
+; CHECK-NEXT: vmaxbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5f,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
+ %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
ret <32 x bfloat> %res0
}
-define <32 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_512:
+define <32 x bfloat> @test_int_x86_avx10_maskz_max_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1]
+; X64-NEXT: vmaxbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_512:
+; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1]
+; X86-NEXT: vmaxbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %msk to <32 x i1>
- %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
+ %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2)
%res1 = select <32 x i1> %mask, <32 x bfloat> %res0, <32 x bfloat> zeroinitializer
ret <32 x bfloat> %res1
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.512(<32 x bfloat>, <32 x bfloat>, i32)
-define <32 x bfloat> @test_rsqrt_nepbf16_512(<32 x bfloat> %a0) {
-; CHECK-LABEL: test_rsqrt_nepbf16_512:
+define <32 x bfloat> @test_rsqrt_bf16_512(<32 x bfloat> %a0) {
+; CHECK-LABEL: test_rsqrt_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vrsqrtpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xc0]
+; CHECK-NEXT: vrsqrtbf16 %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.512(<32 x bfloat> %a0, <32 x bfloat> zeroinitializer, i32 -1)
+ %res = call <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.512(<32 x bfloat> %a0, <32 x bfloat> zeroinitializer, i32 -1)
ret <32 x bfloat> %res
}
-declare <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat>, i32)
+declare <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat>, i32)
-define i32 @test_int_x86_avx512_fpclass_nepbf16_512(<32 x bfloat> %x0) {
-; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_512:
+define i32 @test_int_x86_avx512_fpclass_bf16_512(<32 x bfloat> %x0) {
+; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_512:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfpclasspbf16 $6, %zmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x48,0x66,0xc8,0x06]
+; CHECK-NEXT: vfpclassbf16 $6, %zmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x48,0x66,0xc8,0x06]
; CHECK-NEXT: # k1 = isPositiveZero(zmm0) | isNegativeZero(zmm0)
-; CHECK-NEXT: vfpclasspbf16 $0, %zmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x66,0xc0,0x00]
+; CHECK-NEXT: vfpclassbf16 $0, %zmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x66,0xc0,0x00]
; CHECK-NEXT: # k0 {%k1} = false
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat> %x0, i32 0)
- %res1 = call <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat> %x0, i32 6)
+ %res = call <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat> %x0, i32 0)
+ %res1 = call <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat> %x0, i32 6)
%1 = and <32 x i1> %res1, %res
%2 = bitcast <32 x i1> %1 to i32
ret i32 %2
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.512(<32 x bfloat>, <32 x bfloat>, i32)
-define <32 x bfloat> @test_rcp_nepbf16_512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) {
-; X64-LABEL: test_rcp_nepbf16_512:
+define <32 x bfloat> @test_rcp_bf16_512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) {
+; X64-LABEL: test_rcp_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrcppbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8]
+; X64-NEXT: vrcpbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8]
; X64-NEXT: vmovaps %zmm1, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_rcp_nepbf16_512:
+; X86-LABEL: test_rcp_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrcppbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8]
+; X86-NEXT: vrcpbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8]
; X86-NEXT: vmovaps %zmm1, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <32 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask)
+ %res = call <32 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask)
ret <32 x bfloat> %res
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
-define <32 x bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_512:
+define <32 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vreducenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08]
-; X64-NEXT: vreducenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X64-NEXT: vreducebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08]
+; X64-NEXT: vreducebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04]
+; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_512:
+; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vreducenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08]
-; X86-NEXT: vreducenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X86-NEXT: vreducebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08]
+; X86-NEXT: vreducebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04]
+; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
- %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
+ %res = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
+ %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
%res2 = fadd <32 x bfloat> %res, %res1
ret <32 x bfloat> %res2
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
-define <32 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_512:
+define <32 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrndscalenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08]
-; X64-NEXT: vrndscalenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X64-NEXT: vrndscalebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08]
+; X64-NEXT: vrndscalebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04]
+; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_512:
+; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrndscalenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08]
-; X86-NEXT: vrndscalenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X86-NEXT: vrndscalebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08]
+; X86-NEXT: vrndscalebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04]
+; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
- %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
+ %res = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
+ %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
%res2 = fadd <32 x bfloat> %res, %res1
ret <32 x bfloat> %res2
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat>, <32 x bfloat>, i32)
-define <32 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) {
-; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_512:
+define <32 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) {
+; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetexppbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0]
+; X64-NEXT: vgetexpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0]
; X64-NEXT: vmovdqu16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xc8]
-; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_512:
+; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetexppbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0]
+; X86-NEXT: vgetexpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0]
; X86-NEXT: vmovdqu16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xc8]
-; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2)
- %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> zeroinitializer, i32 -1)
+ %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2)
+ %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat> %x0, <32 x bfloat> zeroinitializer, i32 -1)
%res3 = fadd <32 x bfloat> %res1, %res2
ret <32 x bfloat> %res3
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32)
-define <32 x bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_512:
+define <32 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetmantpbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08]
-; X64-NEXT: vgetmantpbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X64-NEXT: vgetmantbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08]
+; X64-NEXT: vgetmantbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04]
+; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_512:
+; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetmantpbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08]
-; X86-NEXT: vgetmantpbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
+; X86-NEXT: vgetmantbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08]
+; X86-NEXT: vgetmantbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04]
+; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
- %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
+ %res = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3)
+ %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1)
%res2 = fadd <32 x bfloat> %res, %res1
ret <32 x bfloat> %res2
}
-declare <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat>, <32 x bfloat>, <32 x bfloat>, i32)
+declare <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat>, <32 x bfloat>, <32 x bfloat>, i32)
-define <32 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_512:
+define <32 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_512:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vscalefpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1]
+; X64-NEXT: vscalefbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1]
; X64-NEXT: vmovdqu16 %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xd0]
-; X64-NEXT: vaddnepbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0]
+; X64-NEXT: vaddbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_512:
+; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_512:
; X86: # %bb.0:
; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vscalefpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1]
+; X86-NEXT: vscalefbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1]
; X86-NEXT: vmovdqu16 %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xd0]
-; X86-NEXT: vaddnepbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0]
+; X86-NEXT: vaddbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i32 %x3 to <32 x i1>
- %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3)
- %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> zeroinitializer, i32 -1)
+ %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3)
+ %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> zeroinitializer, i32 -1)
%res3 = fadd <32 x bfloat> %res1, %res2
ret <32 x bfloat> %res3
}
diff --git a/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll b/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll
index c97d27ff324bbb..42831a453cb1dd 100644
--- a/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll
+++ b/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll
@@ -2,48 +2,48 @@
; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X64
; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X86
-define <16 x bfloat> @test_int_x86_avx10_add_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_add_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_add_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_add_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
+; CHECK-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fadd <16 x bfloat> %x1, %x2
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_mask_add_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_add_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2]
+; X64-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_mask_add_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2]
+; X86-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%res0 = fadd <16 x bfloat> %x1, %x2
%res = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> %src
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_add_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2]
-; X64-NEXT: vaddnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x0e]
-; X64-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
+; X64-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2]
+; X64-NEXT: vaddbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x0e]
+; X64-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_256:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2]
-; X86-NEXT: vaddnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x08]
-; X86-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
+; X86-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2]
+; X86-NEXT: vaddbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x08]
+; X86-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%val = load <16 x bfloat>, ptr %ptr
@@ -55,26 +55,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_256(<16 x bfloat> %sr
ret <16 x bfloat> %res3
}
-define <8 x bfloat> @test_int_x86_avx10_add_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_add_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_add_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_add_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
+; CHECK-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fadd <8 x bfloat> %x1, %x2
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_mask_add_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_add_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2]
+; X64-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_mask_add_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2]
+; X86-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%res0 = fadd <8 x bfloat> %x1, %x2
@@ -82,22 +82,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_add_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2]
-; X64-NEXT: vaddnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x0e]
-; X64-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
+; X64-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2]
+; X64-NEXT: vaddbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x0e]
+; X64-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_128:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2]
-; X86-NEXT: vaddnepbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x08]
-; X86-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
+; X86-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2]
+; X86-NEXT: vaddbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x08]
+; X86-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%val = load <8 x bfloat>, ptr %ptr
@@ -109,26 +109,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res3
}
-define <16 x bfloat> @test_int_x86_avx10_sub_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_sub_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_sub_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5c,0xc1]
+; CHECK-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5c,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fsub <16 x bfloat> %x1, %x2
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_mask_sub_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2]
+; X64-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2]
+; X86-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%res0 = fsub <16 x bfloat> %x1, %x2
@@ -136,22 +136,22 @@ define <16 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_256(<16 x bfloat> %src
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2]
-; X64-NEXT: vsubnepbf16 (%rsi), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x0e]
-; X64-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1]
+; X64-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2]
+; X64-NEXT: vsubbf16 (%rsi), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x0e]
+; X64-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_256:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2]
-; X86-NEXT: vsubnepbf16 (%eax), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x08]
-; X86-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1]
+; X86-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2]
+; X86-NEXT: vsubbf16 (%eax), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x08]
+; X86-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%val = load <16 x bfloat>, ptr %ptr
@@ -163,26 +163,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_256(<16 x bfloat> %sr
ret <16 x bfloat> %res3
}
-define <8 x bfloat> @test_int_x86_avx10_sub_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_sub_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_sub_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5c,0xc1]
+; CHECK-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5c,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fsub <8 x bfloat> %x1, %x2
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_mask_sub_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2]
+; X64-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2]
+; X86-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%res0 = fsub <8 x bfloat> %x1, %x2
@@ -190,22 +190,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2]
-; X64-NEXT: vsubnepbf16 (%rsi), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x0e]
-; X64-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1]
+; X64-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2]
+; X64-NEXT: vsubbf16 (%rsi), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x0e]
+; X64-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_128:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2]
-; X86-NEXT: vsubnepbf16 (%eax), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x08]
-; X86-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1]
+; X86-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2]
+; X86-NEXT: vsubbf16 (%eax), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x08]
+; X86-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%val = load <8 x bfloat>, ptr %ptr
@@ -217,26 +217,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res3
}
-define <16 x bfloat> @test_int_x86_avx10_mul_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_mul_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_mul_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_mul_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
+; CHECK-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fmul <16 x bfloat> %x1, %x2
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_mask_mul_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2]
+; X64-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2]
+; X86-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%res0 = fmul <16 x bfloat> %x1, %x2
@@ -244,22 +244,22 @@ define <16 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_256(<16 x bfloat> %src
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2]
-; X64-NEXT: vmulnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x0e]
-; X64-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
+; X64-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2]
+; X64-NEXT: vmulbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x0e]
+; X64-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_256:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2]
-; X86-NEXT: vmulnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x08]
-; X86-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
+; X86-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2]
+; X86-NEXT: vmulbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x08]
+; X86-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%val = load <16 x bfloat>, ptr %ptr
@@ -271,26 +271,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_256(<16 x bfloat> %sr
ret <16 x bfloat> %res3
}
-define <8 x bfloat> @test_int_x86_avx10_mul_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_mul_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_mul_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_mul_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
+; CHECK-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fmul <8 x bfloat> %x1, %x2
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_mask_mul_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2]
+; X64-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2]
+; X86-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%res0 = fmul <8 x bfloat> %x1, %x2
@@ -298,22 +298,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2]
-; X64-NEXT: vmulnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x0e]
-; X64-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
+; X64-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2]
+; X64-NEXT: vmulbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x0e]
+; X64-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_128:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2]
-; X86-NEXT: vmulnepbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x08]
-; X86-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
+; X86-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2]
+; X86-NEXT: vmulbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x08]
+; X86-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%val = load <8 x bfloat>, ptr %ptr
@@ -325,26 +325,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res3
}
-define <16 x bfloat> @test_int_x86_avx10_div_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_div_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_div_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vdivnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
+; CHECK-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fdiv <16 x bfloat> %x1, %x2
ret <16 x bfloat> %res
}
-define <16 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_mask_div_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_div_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2]
+; X64-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_mask_div_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2]
+; X86-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%res0 = fdiv <16 x bfloat> %x1, %x2
@@ -353,22 +353,22 @@ define <16 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_256(<16 x bfloat> %src
}
; FIXME: assembly order is different from fp16 ones
-define <16 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_div_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2]
-; X64-NEXT: vdivnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x0e]
-; X64-NEXT: vdivnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
+; X64-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2]
+; X64-NEXT: vdivbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x0e]
+; X64-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_256:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2]
-; X86-NEXT: vdivnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x08]
-; X86-NEXT: vdivnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
+; X86-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2]
+; X86-NEXT: vdivbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x08]
+; X86-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
%val = load <16 x bfloat>, ptr %ptr
@@ -380,26 +380,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_256(<16 x bfloat> %sr
ret <16 x bfloat> %res3
}
-define <8 x bfloat> @test_int_x86_avx10_div_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_div_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_div_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
+; CHECK-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%res = fdiv <8 x bfloat> %x1, %x2
ret <8 x bfloat> %res
}
-define <8 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_mask_div_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_mask_div_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2]
+; X64-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_mask_div_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2]
+; X86-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%res0 = fdiv <8 x bfloat> %x1, %x2
@@ -408,22 +408,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_128(<8 x bfloat> %src,
}
; FIXME: assembly order is different from fp16 ones
-define <8 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
-; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_div_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) {
+; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2]
-; X64-NEXT: vdivnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x0e]
-; X64-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
+; X64-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2]
+; X64-NEXT: vdivbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x0e]
+; X64-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_128:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08]
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2]
-; X86-NEXT: vdivnepbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x08]
-; X86-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
+; X86-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2]
+; X86-NEXT: vdivbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x08]
+; X86-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
%val = load <8 x bfloat>, ptr %ptr
@@ -435,10 +435,10 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_128(<8 x bfloat> %src,
ret <8 x bfloat> %res3
}
-define i16 @test_int_x86_avx10_vcmppbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16256:
+define i16 @test_int_x86_avx10_vcmpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpunordpbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x03]
+; CHECK-NEXT: vcmpunordbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x03]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: # kill: def $ax killed $ax killed $eax
; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77]
@@ -448,10 +448,10 @@ define i16 @test_int_x86_avx10_vcmppbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2
ret i16 %res
}
-define i16 @test_int_x86_avx10_vcmppbf16256_mask2(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16256_mask2:
+define i16 @test_int_x86_avx10_vcmpbf16256_mask2(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16256_mask2:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpeqpbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x00]
+; CHECK-NEXT: vcmpeqbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x00]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: andl $3, %eax # encoding: [0x83,0xe0,0x03]
; CHECK-NEXT: # kill: def $ax killed $ax killed $eax
@@ -463,10 +463,10 @@ define i16 @test_int_x86_avx10_vcmppbf16256_mask2(<16 x bfloat> %x1, <16 x bfloa
ret i16 %3
}
-define i8 @test_int_x86_avx10_vcmppbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16128:
+define i8 @test_int_x86_avx10_vcmpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpunordpbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x03]
+; CHECK-NEXT: vcmpunordbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x03]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: # kill: def $al killed $al killed $eax
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
@@ -475,10 +475,10 @@ define i8 @test_int_x86_avx10_vcmppbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
ret i8 %res
}
-define i8 @test_int_x86_avx10_vcmppbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_vcmppbf16128_mask2:
+define i8 @test_int_x86_avx10_vcmpbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_vcmpbf16128_mask2:
; CHECK: # %bb.0:
-; CHECK-NEXT: vcmpeqpbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x00]
+; CHECK-NEXT: vcmpeqbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x00]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: andb $3, %al # encoding: [0x24,0x03]
; CHECK-NEXT: # kill: def $al killed $al killed $eax
@@ -489,10 +489,10 @@ define i8 @test_int_x86_avx10_vcmppbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat>
ret i8 %3
}
-define <16 x bfloat> @test_sqrt_nepbf16_256(<16 x bfloat> %a0) {
-; CHECK-LABEL: test_sqrt_nepbf16_256:
+define <16 x bfloat> @test_sqrt_bf16_256(<16 x bfloat> %a0) {
+; CHECK-LABEL: test_sqrt_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsqrtnepbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x51,0xc0]
+; CHECK-NEXT: vsqrtbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x51,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%1 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 x bfloat> %a0)
ret <16 x bfloat> %1
@@ -502,13 +502,13 @@ define <16 x bfloat> @test_mm256_mask_sqrt_pbh(<16 x bfloat> %__W, i16 %__U, <16
; X64-LABEL: test_mm256_mask_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1]
+; X64-NEXT: vsqrtbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1]
+; X86-NEXT: vsqrtbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 x bfloat> %__A)
@@ -521,13 +521,13 @@ define <16 x bfloat> @test_mm256_maskz_sqrt_pbh(i16 %__U, <16 x bfloat>%__A) {
; X64-LABEL: test_mm256_maskz_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0]
+; X64-NEXT: vsqrtbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_maskz_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0]
+; X86-NEXT: vsqrtbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 x bfloat> %__A)
@@ -536,10 +536,10 @@ entry:
ret <16 x bfloat> %2
}
-define <8 x bfloat> @test_sqrt_nepbf16_128(<8 x bfloat> %a0) {
-; CHECK-LABEL: test_sqrt_nepbf16_128:
+define <8 x bfloat> @test_sqrt_bf16_128(<8 x bfloat> %a0) {
+; CHECK-LABEL: test_sqrt_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vsqrtnepbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x51,0xc0]
+; CHECK-NEXT: vsqrtbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x51,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
%1 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %a0)
ret <8 x bfloat> %1
@@ -549,13 +549,13 @@ define <8 x bfloat> @test_mm_mask_sqrt_pbh(<8 x bfloat> %__W, i8 %__U, <8 x bflo
; X64-LABEL: test_mm_mask_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1]
+; X64-NEXT: vsqrtbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1]
+; X86-NEXT: vsqrtbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %__A)
@@ -568,13 +568,13 @@ define <8 x bfloat> @test_mm_maskz_sqrt_pbh(i8 %__U, <8 x bfloat>%__A) {
; X64-LABEL: test_mm_maskz_sqrt_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vsqrtnepbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0]
+; X64-NEXT: vsqrtbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_maskz_sqrt_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vsqrtnepbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0]
+; X86-NEXT: vsqrtbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %__A)
@@ -586,7 +586,7 @@ entry:
define <16 x bfloat> @test_mm256_fmaddne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) {
; CHECK-LABEL: test_mm256_fmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xa8,0xc2]
+; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xa8,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C)
@@ -597,13 +597,13 @@ define <16 x bfloat> @test_mm256_mask_fmaddne_pbh(<16 x bfloat> %__A, i16 zeroex
; X64-LABEL: test_mm256_mask_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1]
+; X64-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1]
+; X86-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C)
@@ -616,14 +616,14 @@ define <16 x bfloat> @test_mm256_mask3_fmaddne_pbh(<16 x bfloat> %__A, <16 x bfl
; X64-LABEL: test_mm256_mask3_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1]
+; X64-NEXT: vfmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1]
; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask3_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1]
+; X86-NEXT: vfmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1]
; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -637,13 +637,13 @@ define <16 x bfloat> @test_mm256_maskz_fmaddne_pbh(i16 zeroext %__U, <16 x bfloa
; X64-LABEL: test_mm256_maskz_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2]
+; X64-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_maskz_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2]
+; X86-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C)
@@ -655,7 +655,7 @@ entry:
define <16 x bfloat> @test_mm256_fmsubne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) {
; CHECK-LABEL: test_mm256_fmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xaa,0xc2]
+; CHECK-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xaa,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <16 x bfloat> %__C
@@ -667,13 +667,13 @@ define <16 x bfloat> @test_mm256_mask_fmsubne_pbh(<16 x bfloat> %__A, i16 zeroex
; X64-LABEL: test_mm256_mask_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1]
+; X64-NEXT: vfmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1]
+; X86-NEXT: vfmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__C
@@ -687,14 +687,14 @@ define <16 x bfloat> @test_mm256_mask3_fmsubne_pbh(<16 x bfloat> %__A, <16 x bfl
; X64-LABEL: test_mm256_mask3_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1]
+; X64-NEXT: vfmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1]
; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask3_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1]
+; X86-NEXT: vfmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1]
; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -709,13 +709,13 @@ define <16 x bfloat> @test_mm256_maskz_fmsubne_pbh(i16 zeroext %__U, <16 x bfloa
; X64-LABEL: test_mm256_maskz_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2]
+; X64-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_maskz_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2]
+; X86-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__C
@@ -728,7 +728,7 @@ entry:
define <16 x bfloat> @test_mm256_fnmaddne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) {
; CHECK-LABEL: test_mm256_fnmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xac,0xc2]
+; CHECK-NEXT: vfnmadd213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xac,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <16 x bfloat> %__B
@@ -740,13 +740,13 @@ define <16 x bfloat> @test_mm256_mask_fnmaddne_pbh(<16 x bfloat> %__A, i16 zeroe
; X64-LABEL: test_mm256_mask_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1]
+; X64-NEXT: vfnmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1]
+; X86-NEXT: vfnmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__B
@@ -760,14 +760,14 @@ define <16 x bfloat> @test_mm256_mask3_fnmaddne_pbh(<16 x bfloat> %__A, <16 x bf
; X64-LABEL: test_mm256_mask3_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1]
+; X64-NEXT: vfnmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1]
; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask3_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1]
+; X86-NEXT: vfnmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1]
; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -782,13 +782,13 @@ define <16 x bfloat> @test_mm256_maskz_fnmaddne_pbh(i16 zeroext %__U, <16 x bflo
; X64-LABEL: test_mm256_maskz_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2]
+; X64-NEXT: vfnmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_maskz_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2]
+; X86-NEXT: vfnmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__B
@@ -801,7 +801,7 @@ entry:
define <16 x bfloat> @test_mm256_fnmsubne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) {
; CHECK-LABEL: test_mm256_fnmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xae,0xc2]
+; CHECK-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xae,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <16 x bfloat> %__B
@@ -814,13 +814,13 @@ define <16 x bfloat> @test_mm256_mask_fnmsubne_pbh(<16 x bfloat> %__A, i16 zeroe
; X64-LABEL: test_mm256_mask_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1]
+; X64-NEXT: vfnmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1]
+; X86-NEXT: vfnmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__B
@@ -835,14 +835,14 @@ define <16 x bfloat> @test_mm256_mask3_fnmsubne_pbh(<16 x bfloat> %__A, <16 x bf
; X64-LABEL: test_mm256_mask3_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1]
+; X64-NEXT: vfnmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1]
; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_mask3_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1]
+; X86-NEXT: vfnmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1]
; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -858,13 +858,13 @@ define <16 x bfloat> @test_mm256_maskz_fnmsubne_pbh(i16 zeroext %__U, <16 x bflo
; X64-LABEL: test_mm256_maskz_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2]
+; X64-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm256_maskz_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2]
+; X86-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <16 x bfloat> %__B
@@ -878,7 +878,7 @@ entry:
define <8 x bfloat> @test_mm_fmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) {
; CHECK-LABEL: test_mm_fmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xa8,0xc2]
+; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xa8,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C)
@@ -889,13 +889,13 @@ define <8 x bfloat> @test_mm_mask_fmaddne_pbh(<8 x bfloat> %__A, i8 zeroext %__U
; X64-LABEL: test_mm_mask_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1]
+; X64-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1]
+; X86-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C)
@@ -908,14 +908,14 @@ define <8 x bfloat> @test_mm_mask3_fmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> %
; X64-LABEL: test_mm_mask3_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1]
+; X64-NEXT: vfmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1]
; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask3_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1]
+; X86-NEXT: vfmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1]
; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -929,13 +929,13 @@ define <8 x bfloat> @test_mm_maskz_fmaddne_pbh(i8 zeroext %__U, <8 x bfloat> %__
; X64-LABEL: test_mm_maskz_fmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2]
+; X64-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_maskz_fmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2]
+; X86-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C)
@@ -947,7 +947,7 @@ entry:
define <8 x bfloat> @test_mm_fmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) {
; CHECK-LABEL: test_mm_fmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xaa,0xc2]
+; CHECK-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xaa,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <8 x bfloat> %__C
@@ -959,13 +959,13 @@ define <8 x bfloat> @test_mm_mask_fmsubne_pbh(<8 x bfloat> %__A, i8 zeroext %__U
; X64-LABEL: test_mm_mask_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1]
+; X64-NEXT: vfmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1]
+; X86-NEXT: vfmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__C
@@ -979,14 +979,14 @@ define <8 x bfloat> @test_mm_mask3_fmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> %
; X64-LABEL: test_mm_mask3_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1]
+; X64-NEXT: vfmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1]
; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask3_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1]
+; X86-NEXT: vfmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1]
; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -1001,13 +1001,13 @@ define <8 x bfloat> @test_mm_maskz_fmsubne_pbh(i8 zeroext %__U, <8 x bfloat> %__
; X64-LABEL: test_mm_maskz_fmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2]
+; X64-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_maskz_fmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2]
+; X86-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__C
@@ -1020,7 +1020,7 @@ entry:
define <8 x bfloat> @test_mm_fnmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) {
; CHECK-LABEL: test_mm_fnmaddne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xac,0xc2]
+; CHECK-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xac,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <8 x bfloat> %__B
@@ -1032,13 +1032,13 @@ define <8 x bfloat> @test_mm_mask_fnmaddne_pbh(<8 x bfloat> %__A, i8 zeroext %__
; X64-LABEL: test_mm_mask_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1]
+; X64-NEXT: vfnmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1]
+; X86-NEXT: vfnmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__B
@@ -1052,14 +1052,14 @@ define <8 x bfloat> @test_mm_mask3_fnmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat>
; X64-LABEL: test_mm_mask3_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1]
+; X64-NEXT: vfnmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1]
; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask3_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1]
+; X86-NEXT: vfnmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1]
; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -1074,13 +1074,13 @@ define <8 x bfloat> @test_mm_maskz_fnmaddne_pbh(i8 zeroext %__U, <8 x bfloat> %_
; X64-LABEL: test_mm_maskz_fnmaddne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2]
+; X64-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_maskz_fnmaddne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2]
+; X86-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__B
@@ -1093,7 +1093,7 @@ entry:
define <8 x bfloat> @test_mm_fnmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) {
; CHECK-LABEL: test_mm_fnmsubne_pbh:
; CHECK: # %bb.0: # %entry
-; CHECK-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xae,0xc2]
+; CHECK-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xae,0xc2]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
entry:
%fneg.i = fneg <8 x bfloat> %__B
@@ -1106,13 +1106,13 @@ define <8 x bfloat> @test_mm_mask_fnmsubne_pbh(<8 x bfloat> %__A, i8 zeroext %__
; X64-LABEL: test_mm_mask_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1]
+; X64-NEXT: vfnmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1]
+; X86-NEXT: vfnmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__B
@@ -1127,14 +1127,14 @@ define <8 x bfloat> @test_mm_mask3_fnmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat>
; X64-LABEL: test_mm_mask3_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1]
+; X64-NEXT: vfnmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1]
; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_mask3_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1]
+; X86-NEXT: vfnmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1]
; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
@@ -1150,13 +1150,13 @@ define <8 x bfloat> @test_mm_maskz_fnmsubne_pbh(i8 zeroext %__U, <8 x bfloat> %_
; X64-LABEL: test_mm_maskz_fnmsubne_pbh:
; X64: # %bb.0: # %entry
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2]
+; X64-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: test_mm_maskz_fnmsubne_pbh:
; X86: # %bb.0: # %entry
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2]
+; X86-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
entry:
%fneg.i.i = fneg <8 x bfloat> %__B
@@ -1170,8 +1170,8 @@ entry:
define <32 x bfloat> @addv(<32 x bfloat> %a, <32 x bfloat> %b) nounwind {
; X64-LABEL: addv:
; X64: # %bb.0:
-; X64-NEXT: vaddnepbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2]
-; X64-NEXT: vaddnepbf16 %ymm3, %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xcb]
+; X64-NEXT: vaddbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2]
+; X64-NEXT: vaddbf16 %ymm3, %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xcb]
; X64-NEXT: retq # encoding: [0xc3]
;
; X86-LABEL: addv:
@@ -1180,8 +1180,8 @@ define <32 x bfloat> @addv(<32 x bfloat> %a, <32 x bfloat> %b) nounwind {
; X86-NEXT: movl %esp, %ebp # encoding: [0x89,0xe5]
; X86-NEXT: andl $-32, %esp # encoding: [0x83,0xe4,0xe0]
; X86-NEXT: subl $32, %esp # encoding: [0x83,0xec,0x20]
-; X86-NEXT: vaddnepbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2]
-; X86-NEXT: vaddnepbf16 8(%ebp), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0x8d,0x08,0x00,0x00,0x00]
+; X86-NEXT: vaddbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2]
+; X86-NEXT: vaddbf16 8(%ebp), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0x8d,0x08,0x00,0x00,0x00]
; X86-NEXT: movl %ebp, %esp # encoding: [0x89,0xec]
; X86-NEXT: popl %ebp # encoding: [0x5d]
; X86-NEXT: retl # encoding: [0xc3]
diff --git a/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll b/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll
index 59151d4dd96099..f1146d5617f770 100644
--- a/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll
+++ b/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll
@@ -2,118 +2,118 @@
; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X64
; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X86
-declare <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat>, <16 x bfloat>)
+declare <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat>, <16 x bfloat>)
-define <16 x bfloat> @test_int_x86_avx10_min_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_min_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_min_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5d,0xc1]
+; CHECK-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5d,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
+ %res0 = call <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
ret <16 x bfloat> %res0
}
-define <16 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_min_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1]
+; X64-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1]
+; X86-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
- %res0 = call <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
+ %res0 = call <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
%res1 = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> zeroinitializer
ret <16 x bfloat> %res1
}
-declare <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat>, <8 x bfloat>)
+declare <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat>, <8 x bfloat>)
-define <8 x bfloat> @test_int_x86_avx10_min_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_min_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_min_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5d,0xc1]
+; CHECK-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5d,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
+ %res0 = call <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
ret <8 x bfloat> %res0
}
-define <8 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_min_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1]
+; X64-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1]
+; X86-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
- %res0 = call <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
+ %res0 = call <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
%res1 = select <8 x i1> %mask, <8 x bfloat> %res0, <8 x bfloat> zeroinitializer
ret <8 x bfloat> %res1
}
-declare <16 x bfloat> @llvm.x86.avx10.vmaxpbf16256(<16 x bfloat>, <16 x bfloat>)
+declare <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat>, <16 x bfloat>)
-define <16 x bfloat> @test_int_x86_avx10_max_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_max_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_max_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5f,0xc1]
+; CHECK-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5f,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
+ %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
ret <16 x bfloat> %res0
}
-define <16 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_256:
+define <16 x bfloat> @test_int_x86_avx10_maskz_max_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1]
+; X64-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_256:
+; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1]
+; X86-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %msk to <16 x i1>
- %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
+ %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2)
%res1 = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> zeroinitializer
ret <16 x bfloat> %res1
}
-declare <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat>, <8 x bfloat>)
+declare <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat>, <8 x bfloat>)
-define <8 x bfloat> @test_int_x86_avx10_max_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
-; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_max_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) {
+; CHECK-LABEL: test_int_x86_avx10_max_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5f,0xc1]
+; CHECK-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5f,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
+ %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
ret <8 x bfloat> %res0
}
-define <8 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) {
-; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_128:
+define <8 x bfloat> @test_int_x86_avx10_maskz_max_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) {
+; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1]
+; X64-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_128:
+; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1]
+; X86-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %msk to <8 x i1>
- %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
+ %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2)
%res1 = select <8 x i1> %mask, <8 x bfloat> %res0, <8 x bfloat> zeroinitializer
ret <8 x bfloat> %res1
}
@@ -184,421 +184,421 @@ define i32 @test_x86_avx10_com_nesbf16_neq(<8 x bfloat> %a0, <8 x bfloat> %a1) {
ret i32 %res
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.128(<8 x bfloat>, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.256(<16 x bfloat>, <16 x bfloat>, i16)
-define <8 x bfloat> @test_rsqrt_nepbf16_128(<8 x bfloat> %a0) {
-; CHECK-LABEL: test_rsqrt_nepbf16_128:
+define <8 x bfloat> @test_rsqrt_bf16_128(<8 x bfloat> %a0) {
+; CHECK-LABEL: test_rsqrt_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vrsqrtpbf16 %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xc0]
+; CHECK-NEXT: vrsqrtbf16 %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.128(<8 x bfloat> %a0, <8 x bfloat> zeroinitializer, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.128(<8 x bfloat> %a0, <8 x bfloat> zeroinitializer, i8 -1)
ret <8 x bfloat> %res
}
-define <16 x bfloat> @test_rsqrt_nepbf16_256(<16 x bfloat> %a0) {
-; CHECK-LABEL: test_rsqrt_nepbf16_256:
+define <16 x bfloat> @test_rsqrt_bf16_256(<16 x bfloat> %a0) {
+; CHECK-LABEL: test_rsqrt_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vrsqrtpbf16 %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xc0]
+; CHECK-NEXT: vrsqrtbf16 %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.256(<16 x bfloat> %a0, <16 x bfloat> zeroinitializer, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.256(<16 x bfloat> %a0, <16 x bfloat> zeroinitializer, i16 -1)
ret <16 x bfloat> %res
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.128(<8 x bfloat>, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.256(<16 x bfloat>, <16 x bfloat>, i16)
-define <8 x bfloat> @test_rcp_nepbf16_128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) {
-; X64-LABEL: test_rcp_nepbf16_128:
+define <8 x bfloat> @test_rcp_bf16_128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) {
+; X64-LABEL: test_rcp_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrcppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8]
+; X64-NEXT: vrcpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8]
; X64-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_rcp_nepbf16_128:
+; X86-LABEL: test_rcp_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrcppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8]
+; X86-NEXT: vrcpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8]
; X86-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask)
ret <8 x bfloat> %res
}
-define <16 x bfloat> @test_rcp_nepbf16_256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) {
-; X64-LABEL: test_rcp_nepbf16_256:
+define <16 x bfloat> @test_rcp_bf16_256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) {
+; X64-LABEL: test_rcp_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrcppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8]
+; X64-NEXT: vrcpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8]
; X64-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_rcp_nepbf16_256:
+; X86-LABEL: test_rcp_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrcppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8]
+; X86-NEXT: vrcpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8]
; X86-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask)
ret <16 x bfloat> %res
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
-define <8 x bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vreducenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08]
-; X64-NEXT: vreducenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X64-NEXT: vreducebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08]
+; X64-NEXT: vreducebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04]
+; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vreducenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08]
-; X86-NEXT: vreducenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X86-NEXT: vreducebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08]
+; X86-NEXT: vreducebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04]
+; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
- %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
+ %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
%res2 = fadd <8 x bfloat> %res, %res1
ret <8 x bfloat> %res2
}
-define <16 x bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vreducenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08]
-; X64-NEXT: vreducenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X64-NEXT: vreducebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08]
+; X64-NEXT: vreducebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04]
+; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vreducenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08]
-; X86-NEXT: vreducenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X86-NEXT: vreducebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08]
+; X86-NEXT: vreducebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04]
+; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
- %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
+ %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
%res2 = fadd <16 x bfloat> %res, %res1
ret <16 x bfloat> %res2
}
-declare <8 x i1> @llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat>, i32)
-declare <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat>, i32)
+declare <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat>, i32)
+declare <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat>, i32)
-define i8 @test_int_x86_avx512_fpclass_nepbf16_128(<8 x bfloat> %x0) {
-; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_128:
+define i8 @test_int_x86_avx512_fpclass_bf16_128(<8 x bfloat> %x0) {
+; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfpclasspbf16 $2, %xmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x08,0x66,0xc8,0x02]
+; CHECK-NEXT: vfpclassbf16 $2, %xmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x08,0x66,0xc8,0x02]
; CHECK-NEXT: # k1 = isPositiveZero(xmm0)
-; CHECK-NEXT: vfpclasspbf16 $4, %xmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x66,0xc0,0x04]
+; CHECK-NEXT: vfpclassbf16 $4, %xmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x66,0xc0,0x04]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: # kill: def $al killed $al killed $eax
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <8 x i1> @llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat> %x0, i32 4)
- %res1 = call <8 x i1> @llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat> %x0, i32 2)
+ %res = call <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat> %x0, i32 4)
+ %res1 = call <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat> %x0, i32 2)
%1 = and <8 x i1> %res1, %res
%2 = bitcast <8 x i1> %1 to i8
ret i8 %2
}
-define i16 @test_int_x86_avx512_fpclass_nepbf16_256(<16 x bfloat> %x0) {
-; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_256:
+define i16 @test_int_x86_avx512_fpclass_bf16_256(<16 x bfloat> %x0) {
+; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vfpclasspbf16 $2, %ymm0, %k1 # encoding: [0x62,0xf3,0x7f,0x28,0x66,0xc8,0x02]
+; CHECK-NEXT: vfpclassbf16 $2, %ymm0, %k1 # encoding: [0x62,0xf3,0x7f,0x28,0x66,0xc8,0x02]
; CHECK-NEXT: # k1 = isPositiveZero(ymm0)
-; CHECK-NEXT: vfpclasspbf16 $4, %ymm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x66,0xc0,0x04]
+; CHECK-NEXT: vfpclassbf16 $4, %ymm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x66,0xc0,0x04]
; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0]
; CHECK-NEXT: # kill: def $ax killed $ax killed $eax
; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat> %x0, i32 4)
- %res1 = call <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat> %x0, i32 2)
+ %res = call <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat> %x0, i32 4)
+ %res1 = call <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat> %x0, i32 2)
%1 = and <16 x i1> %res1, %res
%2 = bitcast <16 x i1> %1 to i16
ret i16 %2
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat>, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat>, <16 x bfloat>, i16)
-define <8 x bfloat>@test_int_x86_avx512_getexp_nepbf16_128(<8 x bfloat> %x0) {
-; CHECK-LABEL: test_int_x86_avx512_getexp_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_getexp_bf16_128(<8 x bfloat> %x0) {
+; CHECK-LABEL: test_int_x86_avx512_getexp_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vgetexppbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x42,0xc0]
+; CHECK-NEXT: vgetexpbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x42,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 -1)
ret <8 x bfloat> %res
}
-define <8 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) {
-; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) {
+; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetexppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8]
+; X64-NEXT: vgetexpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8]
; X64-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetexppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8]
+; X86-NEXT: vgetexpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8]
; X86-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2)
ret <8 x bfloat> %res
}
-define <8 x bfloat>@test_int_x86_avx512_maskz_getexp_nepbf16_128(<8 x bfloat> %x0, i8 %x2) {
-; X64-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_maskz_getexp_bf16_128(<8 x bfloat> %x0, i8 %x2) {
+; X64-LABEL: test_int_x86_avx512_maskz_getexp_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetexppbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0]
+; X64-NEXT: vgetexpbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_maskz_getexp_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetexppbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0]
+; X86-NEXT: vgetexpbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 %x2)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 %x2)
ret <8 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_getexp_nepbf16_256(<16 x bfloat> %x0) {
-; CHECK-LABEL: test_int_x86_avx512_getexp_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_getexp_bf16_256(<16 x bfloat> %x0) {
+; CHECK-LABEL: test_int_x86_avx512_getexp_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vgetexppbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x42,0xc0]
+; CHECK-NEXT: vgetexpbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x42,0xc0]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 -1)
ret <16 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) {
-; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) {
+; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetexppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8]
+; X64-NEXT: vgetexpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8]
; X64-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetexppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8]
+; X86-NEXT: vgetexpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8]
; X86-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2)
ret <16 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_maskz_getexp_nepbf16_256(<16 x bfloat> %x0, i16 %x2) {
-; X64-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_maskz_getexp_bf16_256(<16 x bfloat> %x0, i16 %x2) {
+; X64-LABEL: test_int_x86_avx512_maskz_getexp_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetexppbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0]
+; X64-NEXT: vgetexpbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_maskz_getexp_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetexppbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0]
+; X86-NEXT: vgetexpbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 %x2)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 %x2)
ret <16 x bfloat> %res
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
-define <8 x bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetmantpbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08]
-; X64-NEXT: vgetmantpbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X64-NEXT: vgetmantbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08]
+; X64-NEXT: vgetmantbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04]
+; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetmantpbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08]
-; X86-NEXT: vgetmantpbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X86-NEXT: vgetmantbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08]
+; X86-NEXT: vgetmantbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04]
+; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
- %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
+ %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
%res2 = fadd <8 x bfloat> %res, %res1
ret <8 x bfloat> %res2
}
-define <16 x bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vgetmantpbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08]
-; X64-NEXT: vgetmantpbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X64-NEXT: vgetmantbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08]
+; X64-NEXT: vgetmantbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04]
+; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vgetmantpbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08]
-; X86-NEXT: vgetmantpbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X86-NEXT: vgetmantbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08]
+; X86-NEXT: vgetmantbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04]
+; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
- %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
+ %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
%res2 = fadd <16 x bfloat> %res, %res1
ret <16 x bfloat> %res2
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16)
-define <8 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrndscalenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08]
-; X64-NEXT: vrndscalenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X64-NEXT: vrndscalebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08]
+; X64-NEXT: vrndscalebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04]
+; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrndscalenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08]
-; X86-NEXT: vrndscalenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
+; X86-NEXT: vrndscalebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08]
+; X86-NEXT: vrndscalebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04]
+; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
- %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3)
+ %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1)
%res2 = fadd <8 x bfloat> %res, %res1
ret <8 x bfloat> %res2
}
-define <16 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vrndscalenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08]
-; X64-NEXT: vrndscalenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04]
-; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X64-NEXT: vrndscalebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08]
+; X64-NEXT: vrndscalebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04]
+; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vrndscalenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08]
-; X86-NEXT: vrndscalenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04]
-; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
+; X86-NEXT: vrndscalebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08]
+; X86-NEXT: vrndscalebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04]
+; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0]
; X86-NEXT: retl # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
- %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3)
+ %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1)
%res2 = fadd <16 x bfloat> %res, %res1
ret <16 x bfloat> %res2
}
-declare <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat>, <8 x bfloat>, <8 x bfloat>, i8)
-declare <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat>, <16 x bfloat>, <16 x bfloat>, i16)
+declare <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat>, <8 x bfloat>, <8 x bfloat>, i8)
+declare <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat>, <16 x bfloat>, <16 x bfloat>, i16)
-define <8 x bfloat>@test_int_x86_avx512_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1) {
-; CHECK-LABEL: test_int_x86_avx512_scalef_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1) {
+; CHECK-LABEL: test_int_x86_avx512_scalef_bf16_128:
; CHECK: # %bb.0:
-; CHECK-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x2c,0xc1]
+; CHECK-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x2c,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 -1)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 -1)
ret <8 x bfloat> %res
}
-define <8 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1]
+; X64-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1]
; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1]
+; X86-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1]
; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %x3 to <8 x i1>
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3)
ret <8 x bfloat> %res
}
-define <8 x bfloat>@test_int_x86_avx512_maskz_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x3) {
-; X64-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_128:
+define <8 x bfloat>@test_int_x86_avx512_maskz_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x3) {
+; X64-LABEL: test_int_x86_avx512_maskz_scalef_bf16_128:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1]
+; X64-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_128:
+; X86-LABEL: test_int_x86_avx512_maskz_scalef_bf16_128:
; X86: # %bb.0:
; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1]
+; X86-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i8 %x3 to <8 x i1>
- %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 %x3)
+ %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 %x3)
ret <8 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1) {
-; CHECK-LABEL: test_int_x86_avx512_scalef_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1) {
+; CHECK-LABEL: test_int_x86_avx512_scalef_bf16_256:
; CHECK: # %bb.0:
-; CHECK-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x2c,0xc1]
+; CHECK-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x2c,0xc1]
; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3]
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 -1)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 -1)
ret <16 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) {
-; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) {
+; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1]
+; X64-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1]
; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1]
+; X86-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1]
; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %x3 to <16 x i1>
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3)
ret <16 x bfloat> %res
}
-define <16 x bfloat>@test_int_x86_avx512_maskz_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x3) {
-; X64-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_256:
+define <16 x bfloat>@test_int_x86_avx512_maskz_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x3) {
+; X64-LABEL: test_int_x86_avx512_maskz_scalef_bf16_256:
; X64: # %bb.0:
; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf]
-; X64-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1]
+; X64-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1]
; X64-NEXT: retq # encoding: [0xc3]
;
-; X86-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_256:
+; X86-LABEL: test_int_x86_avx512_maskz_scalef_bf16_256:
; X86: # %bb.0:
; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04]
-; X86-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1]
+; X86-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1]
; X86-NEXT: retl # encoding: [0xc3]
%mask = bitcast i16 %x3 to <16 x i1>
- %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 %x3)
+ %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 %x3)
ret <16 x bfloat> %res
}
diff --git a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt
index 8cc53db077e4f7..b278f1d46e4d5f 100644
--- a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt
+++ b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt
@@ -1,208 +1,208 @@
# RUN: llvm-mc --disassemble %s -triple=i386 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=i386 --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL
-# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vaddnepbf16 ymm2, ymm3, ymm4
+# ATT: vaddbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vaddbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x58,0xd4
-# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vaddnepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x58,0xd4
-# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x58,0xd4
-# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vaddnepbf16 zmm2, zmm3, zmm4
+# ATT: vaddbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vaddbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x58,0xd4
-# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vaddnepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x58,0xd4
-# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x58,0xd4
-# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vaddnepbf16 xmm2, xmm3, xmm4
+# ATT: vaddbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vaddbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x58,0xd4
-# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vaddnepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vaddbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x58,0xd4
-# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x58,0xd4
-# ATT: vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vaddbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vaddbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x58,0x10
-# ATT: vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f
-# ATT: vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x58,0x52,0x80
-# ATT: vaddnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vaddbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vaddbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x58,0x10
-# ATT: vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f
-# ATT: vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x58,0x52,0x80
-# ATT: vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vaddbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vaddbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x58,0x10
-# ATT: vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vaddbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vaddbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f
-# ATT: vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x58,0x52,0x80
-# ATT: vcmppbf16 $123, %ymm4, %ymm3, %k5
-# INTEL: vcmppbf16 k5, ymm3, ymm4, 123
+# ATT: vcmpbf16 $123, %ymm4, %ymm3, %k5
+# INTEL: vcmpbf16 k5, ymm3, ymm4, 123
0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm3, ymm4, 123
+# ATT: vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm3, ymm4, 123
0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, %xmm4, %xmm3, %k5
-# INTEL: vcmppbf16 k5, xmm3, xmm4, 123
+# ATT: vcmpbf16 $123, %xmm4, %xmm3, %k5
+# INTEL: vcmpbf16 k5, xmm3, xmm4, 123
0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, %xmm4, %xmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm3, xmm4, 123
+# ATT: vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm3, xmm4, 123
0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, %zmm4, %zmm3, %k5
-# INTEL: vcmppbf16 k5, zmm3, zmm4, 123
+# ATT: vcmpbf16 $123, %zmm4, %zmm3, %k5
+# INTEL: vcmpbf16 k5, zmm3, zmm4, 123
0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm3, zmm4, 123
+# ATT: vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm3, zmm4, 123
0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b
-# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
-# INTEL: vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
+# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
+# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5
-# INTEL: vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123
+# ATT: vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5
+# INTEL: vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123
0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b
-# ATT: vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5
-# INTEL: vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
+# ATT: vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5
+# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
+# ATT: vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
+# ATT: vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b
-# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
-# INTEL: vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
+# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
+# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5
-# INTEL: vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123
+# ATT: vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5
+# INTEL: vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123
0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b
-# ATT: vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5
-# INTEL: vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
+# ATT: vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5
+# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
+# ATT: vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
+# ATT: vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b
-# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
-# INTEL: vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
+# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
+# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5
-# INTEL: vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123
+# ATT: vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5
+# INTEL: vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123
0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b
-# ATT: vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5
-# INTEL: vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
+# ATT: vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5
+# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
+# ATT: vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
+# ATT: vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b
# ATT: vcomsbf16 %xmm3, %xmm2
@@ -233,2783 +233,2783 @@
# INTEL: vcomsbf16 xmm2, word ptr [edx - 256]
0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80
-# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vdivnepbf16 ymm2, ymm3, ymm4
+# ATT: vdivbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vdivbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5e,0xd4
-# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vdivnepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5e,0xd4
-# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5e,0xd4
-# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vdivnepbf16 zmm2, zmm3, zmm4
+# ATT: vdivbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vdivbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5e,0xd4
-# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vdivnepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5e,0xd4
-# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5e,0xd4
-# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vdivnepbf16 xmm2, xmm3, xmm4
+# ATT: vdivbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vdivbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5e,0xd4
-# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vdivnepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5e,0xd4
-# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5e,0xd4
-# ATT: vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vdivbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vdivbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5e,0x10
-# ATT: vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f
-# ATT: vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80
-# ATT: vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vdivbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vdivbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5e,0x10
-# ATT: vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f
-# ATT: vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80
-# ATT: vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vdivbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vdivbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5e,0x10
-# ATT: vdivnepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vdivbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f
-# ATT: vdivnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80
-# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmadd132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x98,0xd4
-# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x98,0xd4
-# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x98,0xd4
-# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmadd132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x98,0xd4
-# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x98,0xd4
-# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x98,0xd4
-# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmadd132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x98,0xd4
-# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x98,0xd4
-# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x98,0xd4
-# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x98,0x10
-# ATT: vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f
-# ATT: vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x98,0x52,0x80
-# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x98,0x10
-# ATT: vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f
-# ATT: vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x98,0x52,0x80
-# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x98,0x10
-# ATT: vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f
-# ATT: vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x98,0x52,0x80
-# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmadd213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmadd213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmadd213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xa8,0xd4
-# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xa8,0xd4
-# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xa8,0x10
-# ATT: vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f
-# ATT: vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80
-# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xa8,0x10
-# ATT: vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f
-# ATT: vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80
-# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xa8,0x10
-# ATT: vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f
-# ATT: vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80
-# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmadd231bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmadd231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmadd231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmadd231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xb8,0xd4
-# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xb8,0xd4
-# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xb8,0x10
-# ATT: vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f
-# ATT: vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80
-# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xb8,0x10
-# ATT: vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f
-# ATT: vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80
-# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xb8,0x10
-# ATT: vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f
-# ATT: vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80
-# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmsub132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmsub132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmsub132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9a,0xd4
-# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9a,0xd4
-# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9a,0x10
-# ATT: vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f
-# ATT: vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80
-# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9a,0x10
-# ATT: vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f
-# ATT: vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80
-# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9a,0x10
-# ATT: vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f
-# ATT: vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80
-# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmsub213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmsub213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmsub213bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmsub213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xaa,0xd4
-# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xaa,0xd4
-# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xaa,0x10
-# ATT: vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f
-# ATT: vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80
-# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xaa,0x10
-# ATT: vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f
-# ATT: vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80
-# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xaa,0x10
-# ATT: vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f
-# ATT: vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80
-# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymm4
+# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfmsub231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xba,0xd4
-# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xba,0xd4
-# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xba,0xd4
-# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmm4
+# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfmsub231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xba,0xd4
-# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xba,0xd4
-# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xba,0xd4
-# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmm4
+# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfmsub231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xba,0xd4
-# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xba,0xd4
-# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xba,0xd4
-# ATT: vfmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xba,0x10
-# ATT: vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f
-# ATT: vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xba,0x52,0x80
-# ATT: vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xba,0x10
-# ATT: vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f
-# ATT: vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xba,0x52,0x80
-# ATT: vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xba,0x10
-# ATT: vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f
-# ATT: vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xba,0x52,0x80
-# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmadd132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmadd132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmadd132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9c,0xd4
-# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9c,0x10
-# ATT: vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f
-# ATT: vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80
-# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9c,0x10
-# ATT: vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f
-# ATT: vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80
-# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9c,0x10
-# ATT: vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f
-# ATT: vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80
-# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmadd213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmadd213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmadd213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xac,0xd4
-# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xac,0xd4
-# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xac,0x10
-# ATT: vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f
-# ATT: vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xac,0x52,0x80
-# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xac,0x10
-# ATT: vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f
-# ATT: vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xac,0x52,0x80
-# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xac,0x10
-# ATT: vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f
-# ATT: vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xac,0x52,0x80
-# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmadd231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmadd231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmadd231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xbc,0xd4
-# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xbc,0x10
-# ATT: vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f
-# ATT: vfnmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80
-# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xbc,0x10
-# ATT: vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f
-# ATT: vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80
-# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xbc,0x10
-# ATT: vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f
-# ATT: vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80
-# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmsub132nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmsub132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmsub132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmsub132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9e,0xd4
-# ATT: vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9e,0x10
-# ATT: vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f
-# ATT: vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80
-# ATT: vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9e,0x10
-# ATT: vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f
-# ATT: vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80
-# ATT: vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9e,0x10
-# ATT: vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f
-# ATT: vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80
-# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmsub213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmsub213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmsub213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xae,0xd4
-# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xae,0xd4
-# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xae,0x10
-# ATT: vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f
-# ATT: vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xae,0x52,0x80
-# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xae,0x10
-# ATT: vfnmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f
-# ATT: vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xae,0x52,0x80
-# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xae,0x10
-# ATT: vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f
-# ATT: vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xae,0x52,0x80
-# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymm4
+# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2
+# INTEL: vfnmsub231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmm4
+# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2
+# INTEL: vfnmsub231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmm4
+# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2
+# INTEL: vfnmsub231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xbe,0xd4
-# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xbe,0x10
-# ATT: vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f
-# ATT: vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80
-# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xbe,0x10
-# ATT: vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f
-# ATT: vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80
-# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xbe,0x10
-# ATT: vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f
-# ATT: vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80
-# ATT: vfpclasspbf16 $123, %zmm3, %k5
-# INTEL: vfpclasspbf16 k5, zmm3, 123
+# ATT: vfpclassbf16 $123, %zmm3, %k5
+# INTEL: vfpclassbf16 k5, zmm3, 123
0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16 $123, %zmm3, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, zmm3, 123
+# ATT: vfpclassbf16 $123, %zmm3, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16 $123, %ymm3, %k5
-# INTEL: vfpclasspbf16 k5, ymm3, 123
+# ATT: vfpclassbf16 $123, %ymm3, %k5
+# INTEL: vfpclassbf16 k5, ymm3, 123
0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16 $123, %ymm3, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, ymm3, 123
+# ATT: vfpclassbf16 $123, %ymm3, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16 $123, %xmm3, %k5
-# INTEL: vfpclasspbf16 k5, xmm3, 123
+# ATT: vfpclassbf16 $123, %xmm3, %k5
+# INTEL: vfpclassbf16 k5, xmm3, 123
0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16 $123, %xmm3, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmm3, 123
+# ATT: vfpclassbf16 $123, %xmm3, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b
-# ATT: vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5
-# INTEL: vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5
+# INTEL: vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+# ATT: vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vfpclasspbf16 $123, (%eax){1to8}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to8}, 123
+# ATT: vfpclassbf16 $123, (%eax){1to8}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b
-# ATT: vfpclasspbf16x $123, -512(,%ebp,2), %k5
-# INTEL: vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123
+# ATT: vfpclassbf16x $123, -512(,%ebp,2), %k5
+# INTEL: vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
+# ATT: vfpclassbf16x $123, 2032(%ecx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
+# ATT: vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b
-# ATT: vfpclasspbf16 $123, (%eax){1to16}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to16}, 123
+# ATT: vfpclassbf16 $123, (%eax){1to16}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b
-# ATT: vfpclasspbf16y $123, -1024(,%ebp,2), %k5
-# INTEL: vfpclasspbf16 k5, ymmword ptr [2*ebp - 1024], 123
+# ATT: vfpclassbf16y $123, -1024(,%ebp,2), %k5
+# INTEL: vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
+# ATT: vfpclassbf16y $123, 4064(%ecx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%edx){1to16}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
+# ATT: vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b
-# ATT: vfpclasspbf16 $123, (%eax){1to32}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to32}, 123
+# ATT: vfpclassbf16 $123, (%eax){1to32}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b
-# ATT: vfpclasspbf16z $123, -2048(,%ebp,2), %k5
-# INTEL: vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123
+# ATT: vfpclassbf16z $123, -2048(,%ebp,2), %k5
+# INTEL: vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
+# ATT: vfpclassbf16z $123, 8128(%ecx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
+# ATT: vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b
-# ATT: vgetexppbf16 %xmm3, %xmm2
-# INTEL: vgetexppbf16 xmm2, xmm3
+# ATT: vgetexpbf16 %xmm3, %xmm2
+# INTEL: vgetexpbf16 xmm2, xmm3
0x62,0xf5,0x7d,0x08,0x42,0xd3
-# ATT: vgetexppbf16 %xmm3, %xmm2 {%k7}
-# INTEL: vgetexppbf16 xmm2 {k7}, xmm3
+# ATT: vgetexpbf16 %xmm3, %xmm2 {%k7}
+# INTEL: vgetexpbf16 xmm2 {k7}, xmm3
0x62,0xf5,0x7d,0x0f,0x42,0xd3
-# ATT: vgetexppbf16 %xmm3, %xmm2 {%k7} {z}
-# INTEL: vgetexppbf16 xmm2 {k7} {z}, xmm3
+# ATT: vgetexpbf16 %xmm3, %xmm2 {%k7} {z}
+# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmm3
0x62,0xf5,0x7d,0x8f,0x42,0xd3
-# ATT: vgetexppbf16 %zmm3, %zmm2
-# INTEL: vgetexppbf16 zmm2, zmm3
+# ATT: vgetexpbf16 %zmm3, %zmm2
+# INTEL: vgetexpbf16 zmm2, zmm3
0x62,0xf5,0x7d,0x48,0x42,0xd3
-# ATT: vgetexppbf16 %zmm3, %zmm2 {%k7}
-# INTEL: vgetexppbf16 zmm2 {k7}, zmm3
+# ATT: vgetexpbf16 %zmm3, %zmm2 {%k7}
+# INTEL: vgetexpbf16 zmm2 {k7}, zmm3
0x62,0xf5,0x7d,0x4f,0x42,0xd3
-# ATT: vgetexppbf16 %zmm3, %zmm2 {%k7} {z}
-# INTEL: vgetexppbf16 zmm2 {k7} {z}, zmm3
+# ATT: vgetexpbf16 %zmm3, %zmm2 {%k7} {z}
+# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmm3
0x62,0xf5,0x7d,0xcf,0x42,0xd3
-# ATT: vgetexppbf16 %ymm3, %ymm2
-# INTEL: vgetexppbf16 ymm2, ymm3
+# ATT: vgetexpbf16 %ymm3, %ymm2
+# INTEL: vgetexpbf16 ymm2, ymm3
0x62,0xf5,0x7d,0x28,0x42,0xd3
-# ATT: vgetexppbf16 %ymm3, %ymm2 {%k7}
-# INTEL: vgetexppbf16 ymm2 {k7}, ymm3
+# ATT: vgetexpbf16 %ymm3, %ymm2 {%k7}
+# INTEL: vgetexpbf16 ymm2 {k7}, ymm3
0x62,0xf5,0x7d,0x2f,0x42,0xd3
-# ATT: vgetexppbf16 %ymm3, %ymm2 {%k7} {z}
-# INTEL: vgetexppbf16 ymm2 {k7} {z}, ymm3
+# ATT: vgetexpbf16 %ymm3, %ymm2 {%k7} {z}
+# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymm3
0x62,0xf5,0x7d,0xaf,0x42,0xd3
-# ATT: vgetexppbf16 268435456(%esp,%esi,8), %xmm2
-# INTEL: vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vgetexpbf16 268435456(%esp,%esi,8), %xmm2
+# INTEL: vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+# ATT: vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%eax){1to8}, %xmm2
-# INTEL: vgetexppbf16 xmm2, word ptr [eax]{1to8}
+# ATT: vgetexpbf16 (%eax){1to8}, %xmm2
+# INTEL: vgetexpbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf5,0x7d,0x18,0x42,0x10
-# ATT: vgetexppbf16 -512(,%ebp,2), %xmm2
-# INTEL: vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512]
+# ATT: vgetexpbf16 -512(,%ebp,2), %xmm2
+# INTEL: vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+# ATT: vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f
-# ATT: vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+# ATT: vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80
-# ATT: vgetexppbf16 268435456(%esp,%esi,8), %ymm2
-# INTEL: vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vgetexpbf16 268435456(%esp,%esi,8), %ymm2
+# INTEL: vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+# ATT: vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%eax){1to16}, %ymm2
-# INTEL: vgetexppbf16 ymm2, word ptr [eax]{1to16}
+# ATT: vgetexpbf16 (%eax){1to16}, %ymm2
+# INTEL: vgetexpbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf5,0x7d,0x38,0x42,0x10
-# ATT: vgetexppbf16 -1024(,%ebp,2), %ymm2
-# INTEL: vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+# ATT: vgetexpbf16 -1024(,%ebp,2), %ymm2
+# INTEL: vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+# ATT: vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f
-# ATT: vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+# ATT: vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80
-# ATT: vgetexppbf16 268435456(%esp,%esi,8), %zmm2
-# INTEL: vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vgetexpbf16 268435456(%esp,%esi,8), %zmm2
+# INTEL: vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+# ATT: vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%eax){1to32}, %zmm2
-# INTEL: vgetexppbf16 zmm2, word ptr [eax]{1to32}
+# ATT: vgetexpbf16 (%eax){1to32}, %zmm2
+# INTEL: vgetexpbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf5,0x7d,0x58,0x42,0x10
-# ATT: vgetexppbf16 -2048(,%ebp,2), %zmm2
-# INTEL: vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+# ATT: vgetexpbf16 -2048(,%ebp,2), %zmm2
+# INTEL: vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+# ATT: vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f
-# ATT: vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+# ATT: vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80
-# ATT: vgetmantpbf16 $123, %zmm3, %zmm2
-# INTEL: vgetmantpbf16 zmm2, zmm3, 123
+# ATT: vgetmantbf16 $123, %zmm3, %zmm2
+# INTEL: vgetmantbf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7}
-# INTEL: vgetmantpbf16 zmm2 {k7}, zmm3, 123
+# ATT: vgetmantbf16 $123, %zmm3, %zmm2 {%k7}
+# INTEL: vgetmantbf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123
+# ATT: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %ymm3, %ymm2
-# INTEL: vgetmantpbf16 ymm2, ymm3, 123
+# ATT: vgetmantbf16 $123, %ymm3, %ymm2
+# INTEL: vgetmantbf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7}
-# INTEL: vgetmantpbf16 ymm2 {k7}, ymm3, 123
+# ATT: vgetmantbf16 $123, %ymm3, %ymm2 {%k7}
+# INTEL: vgetmantbf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123
+# ATT: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %xmm3, %xmm2
-# INTEL: vgetmantpbf16 xmm2, xmm3, 123
+# ATT: vgetmantbf16 $123, %xmm3, %xmm2
+# INTEL: vgetmantbf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7}
-# INTEL: vgetmantpbf16 xmm2 {k7}, xmm3, 123
+# ATT: vgetmantbf16 $123, %xmm3, %xmm2 {%k7}
+# INTEL: vgetmantbf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123
+# ATT: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2
-# INTEL: vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2
+# INTEL: vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%eax){1to8}, %xmm2
-# INTEL: vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123
+# ATT: vgetmantbf16 $123, (%eax){1to8}, %xmm2
+# INTEL: vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b
-# ATT: vgetmantpbf16 $123, -512(,%ebp,2), %xmm2
-# INTEL: vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+# ATT: vgetmantbf16 $123, -512(,%ebp,2), %xmm2
+# INTEL: vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+# ATT: vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+# ATT: vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2
-# INTEL: vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2
+# INTEL: vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%eax){1to16}, %ymm2
-# INTEL: vgetmantpbf16 ymm2, word ptr [eax]{1to16}, 123
+# ATT: vgetmantbf16 $123, (%eax){1to16}, %ymm2
+# INTEL: vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b
-# ATT: vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2
-# INTEL: vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+# ATT: vgetmantbf16 $123, -1024(,%ebp,2), %ymm2
+# INTEL: vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+# ATT: vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+# ATT: vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2
-# INTEL: vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2
+# INTEL: vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%eax){1to32}, %zmm2
-# INTEL: vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123
+# ATT: vgetmantbf16 $123, (%eax){1to32}, %zmm2
+# INTEL: vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b
-# ATT: vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2
-# INTEL: vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+# ATT: vgetmantbf16 $123, -2048(,%ebp,2), %zmm2
+# INTEL: vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+# ATT: vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+# ATT: vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b
-# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vmaxpbf16 ymm2, ymm3, ymm4
+# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vmaxbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5f,0xd4
-# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vmaxpbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5f,0xd4
-# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5f,0xd4
-# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vmaxpbf16 zmm2, zmm3, zmm4
+# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vmaxbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5f,0xd4
-# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vmaxpbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5f,0xd4
-# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5f,0xd4
-# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vmaxpbf16 xmm2, xmm3, xmm4
+# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vmaxbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5f,0xd4
-# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vmaxpbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5f,0xd4
-# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5f,0xd4
-# ATT: vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vmaxbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5f,0x10
-# ATT: vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vmaxbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f
-# ATT: vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80
-# ATT: vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vmaxbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5f,0x10
-# ATT: vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f
-# ATT: vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vmaxbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80
-# ATT: vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vmaxbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5f,0x10
-# ATT: vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f
-# ATT: vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80
-# ATT: vminpbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vminpbf16 ymm2, ymm3, ymm4
+# ATT: vminbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vminbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5d,0xd4
-# ATT: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vminpbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vminbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vminbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5d,0xd4
-# ATT: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5d,0xd4
-# ATT: vminpbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vminpbf16 zmm2, zmm3, zmm4
+# ATT: vminbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vminbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5d,0xd4
-# ATT: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vminpbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vminbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vminbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5d,0xd4
-# ATT: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5d,0xd4
-# ATT: vminpbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vminpbf16 xmm2, xmm3, xmm4
+# ATT: vminbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vminbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5d,0xd4
-# ATT: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vminpbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vminbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vminbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5d,0xd4
-# ATT: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5d,0xd4
-# ATT: vminpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vminpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vminbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vminbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5d,0x10
-# ATT: vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vminbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f
-# ATT: vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80
-# ATT: vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vminpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vminbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vminbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5d,0x10
-# ATT: vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vminbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f
-# ATT: vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80
-# ATT: vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vminpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vminbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vminbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5d,0x10
-# ATT: vminpbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vminbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f
-# ATT: vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80
-# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vmulnepbf16 ymm2, ymm3, ymm4
+# ATT: vmulbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vmulbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x59,0xd4
-# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vmulnepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x59,0xd4
-# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x59,0xd4
-# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vmulnepbf16 zmm2, zmm3, zmm4
+# ATT: vmulbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vmulbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x59,0xd4
-# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vmulnepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x59,0xd4
-# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x59,0xd4
-# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vmulnepbf16 xmm2, xmm3, xmm4
+# ATT: vmulbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vmulbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x59,0xd4
-# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vmulnepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x59,0xd4
-# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x59,0xd4
-# ATT: vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vmulbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vmulbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x59,0x10
-# ATT: vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f
-# ATT: vmulnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x59,0x52,0x80
-# ATT: vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vmulbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vmulbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x59,0x10
-# ATT: vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f
-# ATT: vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x59,0x52,0x80
-# ATT: vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vmulbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vmulbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vmulbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x59,0x10
-# ATT: vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vmulbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f
-# ATT: vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x59,0x52,0x80
-# ATT: vrcppbf16 %xmm3, %xmm2
-# INTEL: vrcppbf16 xmm2, xmm3
+# ATT: vrcpbf16 %xmm3, %xmm2
+# INTEL: vrcpbf16 xmm2, xmm3
0x62,0xf6,0x7c,0x08,0x4c,0xd3
-# ATT: vrcppbf16 %xmm3, %xmm2 {%k7}
-# INTEL: vrcppbf16 xmm2 {k7}, xmm3
+# ATT: vrcpbf16 %xmm3, %xmm2 {%k7}
+# INTEL: vrcpbf16 xmm2 {k7}, xmm3
0x62,0xf6,0x7c,0x0f,0x4c,0xd3
-# ATT: vrcppbf16 %xmm3, %xmm2 {%k7} {z}
-# INTEL: vrcppbf16 xmm2 {k7} {z}, xmm3
+# ATT: vrcpbf16 %xmm3, %xmm2 {%k7} {z}
+# INTEL: vrcpbf16 xmm2 {k7} {z}, xmm3
0x62,0xf6,0x7c,0x8f,0x4c,0xd3
-# ATT: vrcppbf16 %zmm3, %zmm2
-# INTEL: vrcppbf16 zmm2, zmm3
+# ATT: vrcpbf16 %zmm3, %zmm2
+# INTEL: vrcpbf16 zmm2, zmm3
0x62,0xf6,0x7c,0x48,0x4c,0xd3
-# ATT: vrcppbf16 %zmm3, %zmm2 {%k7}
-# INTEL: vrcppbf16 zmm2 {k7}, zmm3
+# ATT: vrcpbf16 %zmm3, %zmm2 {%k7}
+# INTEL: vrcpbf16 zmm2 {k7}, zmm3
0x62,0xf6,0x7c,0x4f,0x4c,0xd3
-# ATT: vrcppbf16 %zmm3, %zmm2 {%k7} {z}
-# INTEL: vrcppbf16 zmm2 {k7} {z}, zmm3
+# ATT: vrcpbf16 %zmm3, %zmm2 {%k7} {z}
+# INTEL: vrcpbf16 zmm2 {k7} {z}, zmm3
0x62,0xf6,0x7c,0xcf,0x4c,0xd3
-# ATT: vrcppbf16 %ymm3, %ymm2
-# INTEL: vrcppbf16 ymm2, ymm3
+# ATT: vrcpbf16 %ymm3, %ymm2
+# INTEL: vrcpbf16 ymm2, ymm3
0x62,0xf6,0x7c,0x28,0x4c,0xd3
-# ATT: vrcppbf16 %ymm3, %ymm2 {%k7}
-# INTEL: vrcppbf16 ymm2 {k7}, ymm3
+# ATT: vrcpbf16 %ymm3, %ymm2 {%k7}
+# INTEL: vrcpbf16 ymm2 {k7}, ymm3
0x62,0xf6,0x7c,0x2f,0x4c,0xd3
-# ATT: vrcppbf16 %ymm3, %ymm2 {%k7} {z}
-# INTEL: vrcppbf16 ymm2 {k7} {z}, ymm3
+# ATT: vrcpbf16 %ymm3, %ymm2 {%k7} {z}
+# INTEL: vrcpbf16 ymm2 {k7} {z}, ymm3
0x62,0xf6,0x7c,0xaf,0x4c,0xd3
-# ATT: vrcppbf16 268435456(%esp,%esi,8), %xmm2
-# INTEL: vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vrcpbf16 268435456(%esp,%esi,8), %xmm2
+# INTEL: vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+# ATT: vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%eax){1to8}, %xmm2
-# INTEL: vrcppbf16 xmm2, word ptr [eax]{1to8}
+# ATT: vrcpbf16 (%eax){1to8}, %xmm2
+# INTEL: vrcpbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf6,0x7c,0x18,0x4c,0x10
-# ATT: vrcppbf16 -512(,%ebp,2), %xmm2
-# INTEL: vrcppbf16 xmm2, xmmword ptr [2*ebp - 512]
+# ATT: vrcpbf16 -512(,%ebp,2), %xmm2
+# INTEL: vrcpbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vrcppbf16 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vrcppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+# ATT: vrcpbf16 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f
-# ATT: vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+# ATT: vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80
-# ATT: vrcppbf16 268435456(%esp,%esi,8), %ymm2
-# INTEL: vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vrcpbf16 268435456(%esp,%esi,8), %ymm2
+# INTEL: vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+# ATT: vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%eax){1to16}, %ymm2
-# INTEL: vrcppbf16 ymm2, word ptr [eax]{1to16}
+# ATT: vrcpbf16 (%eax){1to16}, %ymm2
+# INTEL: vrcpbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf6,0x7c,0x38,0x4c,0x10
-# ATT: vrcppbf16 -1024(,%ebp,2), %ymm2
-# INTEL: vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+# ATT: vrcpbf16 -1024(,%ebp,2), %ymm2
+# INTEL: vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vrcppbf16 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+# ATT: vrcpbf16 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f
-# ATT: vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vrcppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+# ATT: vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80
-# ATT: vrcppbf16 268435456(%esp,%esi,8), %zmm2
-# INTEL: vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vrcpbf16 268435456(%esp,%esi,8), %zmm2
+# INTEL: vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+# ATT: vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%eax){1to32}, %zmm2
-# INTEL: vrcppbf16 zmm2, word ptr [eax]{1to32}
+# ATT: vrcpbf16 (%eax){1to32}, %zmm2
+# INTEL: vrcpbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf6,0x7c,0x58,0x4c,0x10
-# ATT: vrcppbf16 -2048(,%ebp,2), %zmm2
-# INTEL: vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+# ATT: vrcpbf16 -2048(,%ebp,2), %zmm2
+# INTEL: vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vrcppbf16 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+# ATT: vrcpbf16 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f
-# ATT: vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+# ATT: vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80
-# ATT: vreducenepbf16 $123, %zmm3, %zmm2
-# INTEL: vreducenepbf16 zmm2, zmm3, 123
+# ATT: vreducebf16 $123, %zmm3, %zmm2
+# INTEL: vreducebf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %zmm3, %zmm2 {%k7}
-# INTEL: vreducenepbf16 zmm2 {k7}, zmm3, 123
+# ATT: vreducebf16 $123, %zmm3, %zmm2 {%k7}
+# INTEL: vreducebf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vreducenepbf16 zmm2 {k7} {z}, zmm3, 123
+# ATT: vreducebf16 $123, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vreducebf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %ymm3, %ymm2
-# INTEL: vreducenepbf16 ymm2, ymm3, 123
+# ATT: vreducebf16 $123, %ymm3, %ymm2
+# INTEL: vreducebf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %ymm3, %ymm2 {%k7}
-# INTEL: vreducenepbf16 ymm2 {k7}, ymm3, 123
+# ATT: vreducebf16 $123, %ymm3, %ymm2 {%k7}
+# INTEL: vreducebf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vreducenepbf16 ymm2 {k7} {z}, ymm3, 123
+# ATT: vreducebf16 $123, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vreducebf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %xmm3, %xmm2
-# INTEL: vreducenepbf16 xmm2, xmm3, 123
+# ATT: vreducebf16 $123, %xmm3, %xmm2
+# INTEL: vreducebf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %xmm3, %xmm2 {%k7}
-# INTEL: vreducenepbf16 xmm2 {k7}, xmm3, 123
+# ATT: vreducebf16 $123, %xmm3, %xmm2 {%k7}
+# INTEL: vreducebf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vreducenepbf16 xmm2 {k7} {z}, xmm3, 123
+# ATT: vreducebf16 $123, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vreducebf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
-# INTEL: vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2
+# INTEL: vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+# ATT: vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%eax){1to8}, %xmm2
-# INTEL: vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123
+# ATT: vreducebf16 $123, (%eax){1to8}, %xmm2
+# INTEL: vreducebf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b
-# ATT: vreducenepbf16 $123, -512(,%ebp,2), %xmm2
-# INTEL: vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+# ATT: vreducebf16 $123, -512(,%ebp,2), %xmm2
+# INTEL: vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+# ATT: vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+# ATT: vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
-# INTEL: vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2
+# INTEL: vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+# ATT: vreducebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%eax){1to16}, %ymm2
-# INTEL: vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123
+# ATT: vreducebf16 $123, (%eax){1to16}, %ymm2
+# INTEL: vreducebf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b
-# ATT: vreducenepbf16 $123, -1024(,%ebp,2), %ymm2
-# INTEL: vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+# ATT: vreducebf16 $123, -1024(,%ebp,2), %ymm2
+# INTEL: vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+# ATT: vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+# ATT: vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
-# INTEL: vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2
+# INTEL: vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+# ATT: vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%eax){1to32}, %zmm2
-# INTEL: vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123
+# ATT: vreducebf16 $123, (%eax){1to32}, %zmm2
+# INTEL: vreducebf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b
-# ATT: vreducenepbf16 $123, -2048(,%ebp,2), %zmm2
-# INTEL: vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+# ATT: vreducebf16 $123, -2048(,%ebp,2), %zmm2
+# INTEL: vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+# ATT: vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+# ATT: vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2
-# INTEL: vrndscalenepbf16 zmm2, zmm3, 123
+# ATT: vrndscalebf16 $123, %zmm3, %zmm2
+# INTEL: vrndscalebf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7}
-# INTEL: vrndscalenepbf16 zmm2 {k7}, zmm3, 123
+# ATT: vrndscalebf16 $123, %zmm3, %zmm2 {%k7}
+# INTEL: vrndscalebf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123
+# ATT: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2
-# INTEL: vrndscalenepbf16 ymm2, ymm3, 123
+# ATT: vrndscalebf16 $123, %ymm3, %ymm2
+# INTEL: vrndscalebf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7}
-# INTEL: vrndscalenepbf16 ymm2 {k7}, ymm3, 123
+# ATT: vrndscalebf16 $123, %ymm3, %ymm2 {%k7}
+# INTEL: vrndscalebf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123
+# ATT: vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2
-# INTEL: vrndscalenepbf16 xmm2, xmm3, 123
+# ATT: vrndscalebf16 $123, %xmm3, %xmm2
+# INTEL: vrndscalebf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7}
-# INTEL: vrndscalenepbf16 xmm2 {k7}, xmm3, 123
+# ATT: vrndscalebf16 $123, %xmm3, %xmm2 {%k7}
+# INTEL: vrndscalebf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123
+# ATT: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
-# INTEL: vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2
+# INTEL: vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%eax){1to8}, %xmm2
-# INTEL: vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123
+# ATT: vrndscalebf16 $123, (%eax){1to8}, %xmm2
+# INTEL: vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2
-# INTEL: vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+# ATT: vrndscalebf16 $123, -512(,%ebp,2), %xmm2
+# INTEL: vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+# ATT: vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+# ATT: vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
-# INTEL: vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2
+# INTEL: vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%eax){1to16}, %ymm2
-# INTEL: vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123
+# ATT: vrndscalebf16 $123, (%eax){1to16}, %ymm2
+# INTEL: vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2
-# INTEL: vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+# ATT: vrndscalebf16 $123, -1024(,%ebp,2), %ymm2
+# INTEL: vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+# ATT: vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+# ATT: vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
-# INTEL: vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2
+# INTEL: vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%eax){1to32}, %zmm2
-# INTEL: vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123
+# ATT: vrndscalebf16 $123, (%eax){1to32}, %zmm2
+# INTEL: vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2
-# INTEL: vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+# ATT: vrndscalebf16 $123, -2048(,%ebp,2), %zmm2
+# INTEL: vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+# ATT: vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+# ATT: vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b
-# ATT: vrsqrtpbf16 %xmm3, %xmm2
-# INTEL: vrsqrtpbf16 xmm2, xmm3
+# ATT: vrsqrtbf16 %xmm3, %xmm2
+# INTEL: vrsqrtbf16 xmm2, xmm3
0x62,0xf6,0x7c,0x08,0x4e,0xd3
-# ATT: vrsqrtpbf16 %xmm3, %xmm2 {%k7}
-# INTEL: vrsqrtpbf16 xmm2 {k7}, xmm3
+# ATT: vrsqrtbf16 %xmm3, %xmm2 {%k7}
+# INTEL: vrsqrtbf16 xmm2 {k7}, xmm3
0x62,0xf6,0x7c,0x0f,0x4e,0xd3
-# ATT: vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, xmm3
+# ATT: vrsqrtbf16 %xmm3, %xmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmm3
0x62,0xf6,0x7c,0x8f,0x4e,0xd3
-# ATT: vrsqrtpbf16 %zmm3, %zmm2
-# INTEL: vrsqrtpbf16 zmm2, zmm3
+# ATT: vrsqrtbf16 %zmm3, %zmm2
+# INTEL: vrsqrtbf16 zmm2, zmm3
0x62,0xf6,0x7c,0x48,0x4e,0xd3
-# ATT: vrsqrtpbf16 %zmm3, %zmm2 {%k7}
-# INTEL: vrsqrtpbf16 zmm2 {k7}, zmm3
+# ATT: vrsqrtbf16 %zmm3, %zmm2 {%k7}
+# INTEL: vrsqrtbf16 zmm2 {k7}, zmm3
0x62,0xf6,0x7c,0x4f,0x4e,0xd3
-# ATT: vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, zmm3
+# ATT: vrsqrtbf16 %zmm3, %zmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmm3
0x62,0xf6,0x7c,0xcf,0x4e,0xd3
-# ATT: vrsqrtpbf16 %ymm3, %ymm2
-# INTEL: vrsqrtpbf16 ymm2, ymm3
+# ATT: vrsqrtbf16 %ymm3, %ymm2
+# INTEL: vrsqrtbf16 ymm2, ymm3
0x62,0xf6,0x7c,0x28,0x4e,0xd3
-# ATT: vrsqrtpbf16 %ymm3, %ymm2 {%k7}
-# INTEL: vrsqrtpbf16 ymm2 {k7}, ymm3
+# ATT: vrsqrtbf16 %ymm3, %ymm2 {%k7}
+# INTEL: vrsqrtbf16 ymm2 {k7}, ymm3
0x62,0xf6,0x7c,0x2f,0x4e,0xd3
-# ATT: vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, ymm3
+# ATT: vrsqrtbf16 %ymm3, %ymm2 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymm3
0x62,0xf6,0x7c,0xaf,0x4e,0xd3
-# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2
-# INTEL: vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %xmm2
+# INTEL: vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+# ATT: vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%eax){1to8}, %xmm2
-# INTEL: vrsqrtpbf16 xmm2, word ptr [eax]{1to8}
+# ATT: vrsqrtbf16 (%eax){1to8}, %xmm2
+# INTEL: vrsqrtbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf6,0x7c,0x18,0x4e,0x10
-# ATT: vrsqrtpbf16 -512(,%ebp,2), %xmm2
-# INTEL: vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512]
+# ATT: vrsqrtbf16 -512(,%ebp,2), %xmm2
+# INTEL: vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+# ATT: vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f
-# ATT: vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+# ATT: vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80
-# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2
-# INTEL: vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %ymm2
+# INTEL: vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+# ATT: vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%eax){1to16}, %ymm2
-# INTEL: vrsqrtpbf16 ymm2, word ptr [eax]{1to16}
+# ATT: vrsqrtbf16 (%eax){1to16}, %ymm2
+# INTEL: vrsqrtbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf6,0x7c,0x38,0x4e,0x10
-# ATT: vrsqrtpbf16 -1024(,%ebp,2), %ymm2
-# INTEL: vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024]
+# ATT: vrsqrtbf16 -1024(,%ebp,2), %ymm2
+# INTEL: vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+# ATT: vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f
-# ATT: vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+# ATT: vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80
-# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2
-# INTEL: vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %zmm2
+# INTEL: vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+# ATT: vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%eax){1to32}, %zmm2
-# INTEL: vrsqrtpbf16 zmm2, word ptr [eax]{1to32}
+# ATT: vrsqrtbf16 (%eax){1to32}, %zmm2
+# INTEL: vrsqrtbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf6,0x7c,0x58,0x4e,0x10
-# ATT: vrsqrtpbf16 -2048(,%ebp,2), %zmm2
-# INTEL: vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048]
+# ATT: vrsqrtbf16 -2048(,%ebp,2), %zmm2
+# INTEL: vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+# ATT: vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f
-# ATT: vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+# ATT: vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80
-# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vscalefpbf16 ymm2, ymm3, ymm4
+# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vscalefbf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x2c,0xd4
-# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vscalefpbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x2c,0xd4
-# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x2c,0xd4
-# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vscalefpbf16 zmm2, zmm3, zmm4
+# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vscalefbf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x2c,0xd4
-# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vscalefpbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x2c,0xd4
-# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x2c,0xd4
-# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vscalefpbf16 xmm2, xmm3, xmm4
+# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vscalefbf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x2c,0xd4
-# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vscalefpbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x2c,0xd4
-# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x2c,0xd4
-# ATT: vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vscalefbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x2c,0x10
-# ATT: vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f
-# ATT: vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80
-# ATT: vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vscalefbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x2c,0x10
-# ATT: vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f
-# ATT: vscalefpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vscalefbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80
-# ATT: vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vscalefbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x2c,0x10
-# ATT: vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f
-# ATT: vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80
-# ATT: vsqrtnepbf16 %xmm3, %xmm2
-# INTEL: vsqrtnepbf16 xmm2, xmm3
+# ATT: vsqrtbf16 %xmm3, %xmm2
+# INTEL: vsqrtbf16 xmm2, xmm3
0x62,0xf5,0x7d,0x08,0x51,0xd3
-# ATT: vsqrtnepbf16 %xmm3, %xmm2 {%k7}
-# INTEL: vsqrtnepbf16 xmm2 {k7}, xmm3
+# ATT: vsqrtbf16 %xmm3, %xmm2 {%k7}
+# INTEL: vsqrtbf16 xmm2 {k7}, xmm3
0x62,0xf5,0x7d,0x0f,0x51,0xd3
-# ATT: vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, xmm3
+# ATT: vsqrtbf16 %xmm3, %xmm2 {%k7} {z}
+# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmm3
0x62,0xf5,0x7d,0x8f,0x51,0xd3
-# ATT: vsqrtnepbf16 %zmm3, %zmm2
-# INTEL: vsqrtnepbf16 zmm2, zmm3
+# ATT: vsqrtbf16 %zmm3, %zmm2
+# INTEL: vsqrtbf16 zmm2, zmm3
0x62,0xf5,0x7d,0x48,0x51,0xd3
-# ATT: vsqrtnepbf16 %zmm3, %zmm2 {%k7}
-# INTEL: vsqrtnepbf16 zmm2 {k7}, zmm3
+# ATT: vsqrtbf16 %zmm3, %zmm2 {%k7}
+# INTEL: vsqrtbf16 zmm2 {k7}, zmm3
0x62,0xf5,0x7d,0x4f,0x51,0xd3
-# ATT: vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, zmm3
+# ATT: vsqrtbf16 %zmm3, %zmm2 {%k7} {z}
+# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmm3
0x62,0xf5,0x7d,0xcf,0x51,0xd3
-# ATT: vsqrtnepbf16 %ymm3, %ymm2
-# INTEL: vsqrtnepbf16 ymm2, ymm3
+# ATT: vsqrtbf16 %ymm3, %ymm2
+# INTEL: vsqrtbf16 ymm2, ymm3
0x62,0xf5,0x7d,0x28,0x51,0xd3
-# ATT: vsqrtnepbf16 %ymm3, %ymm2 {%k7}
-# INTEL: vsqrtnepbf16 ymm2 {k7}, ymm3
+# ATT: vsqrtbf16 %ymm3, %ymm2 {%k7}
+# INTEL: vsqrtbf16 ymm2 {k7}, ymm3
0x62,0xf5,0x7d,0x2f,0x51,0xd3
-# ATT: vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, ymm3
+# ATT: vsqrtbf16 %ymm3, %ymm2 {%k7} {z}
+# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymm3
0x62,0xf5,0x7d,0xaf,0x51,0xd3
-# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2
-# INTEL: vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vsqrtbf16 268435456(%esp,%esi,8), %xmm2
+# INTEL: vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7}
-# INTEL: vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+# ATT: vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
+# INTEL: vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%eax){1to8}, %xmm2
-# INTEL: vsqrtnepbf16 xmm2, word ptr [eax]{1to8}
+# ATT: vsqrtbf16 (%eax){1to8}, %xmm2
+# INTEL: vsqrtbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf5,0x7d,0x18,0x51,0x10
-# ATT: vsqrtnepbf16 -512(,%ebp,2), %xmm2
-# INTEL: vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512]
+# ATT: vsqrtbf16 -512(,%ebp,2), %xmm2
+# INTEL: vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+# ATT: vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
+# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f
-# ATT: vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+# ATT: vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+# INTEL: vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80
-# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2
-# INTEL: vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vsqrtbf16 268435456(%esp,%esi,8), %ymm2
+# INTEL: vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7}
-# INTEL: vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+# ATT: vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
+# INTEL: vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%eax){1to16}, %ymm2
-# INTEL: vsqrtnepbf16 ymm2, word ptr [eax]{1to16}
+# ATT: vsqrtbf16 (%eax){1to16}, %ymm2
+# INTEL: vsqrtbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf5,0x7d,0x38,0x51,0x10
-# ATT: vsqrtnepbf16 -1024(,%ebp,2), %ymm2
-# INTEL: vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024]
+# ATT: vsqrtbf16 -1024(,%ebp,2), %ymm2
+# INTEL: vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+# ATT: vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
+# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f
-# ATT: vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+# ATT: vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+# INTEL: vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80
-# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2
-# INTEL: vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vsqrtbf16 268435456(%esp,%esi,8), %zmm2
+# INTEL: vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7}
-# INTEL: vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+# ATT: vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
+# INTEL: vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%eax){1to32}, %zmm2
-# INTEL: vsqrtnepbf16 zmm2, word ptr [eax]{1to32}
+# ATT: vsqrtbf16 (%eax){1to32}, %zmm2
+# INTEL: vsqrtbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf5,0x7d,0x58,0x51,0x10
-# ATT: vsqrtnepbf16 -2048(,%ebp,2), %zmm2
-# INTEL: vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048]
+# ATT: vsqrtbf16 -2048(,%ebp,2), %zmm2
+# INTEL: vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+# ATT: vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
+# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f
-# ATT: vsqrtnepbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+# ATT: vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+# INTEL: vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80
-# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2
-# INTEL: vsubnepbf16 ymm2, ymm3, ymm4
+# ATT: vsubbf16 %ymm4, %ymm3, %ymm2
+# INTEL: vsubbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5c,0xd4
-# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
-# INTEL: vsubnepbf16 ymm2 {k7}, ymm3, ymm4
+# ATT: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7}
+# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5c,0xd4
-# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+# ATT: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5c,0xd4
-# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2
-# INTEL: vsubnepbf16 zmm2, zmm3, zmm4
+# ATT: vsubbf16 %zmm4, %zmm3, %zmm2
+# INTEL: vsubbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5c,0xd4
-# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
-# INTEL: vsubnepbf16 zmm2 {k7}, zmm3, zmm4
+# ATT: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7}
+# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5c,0xd4
-# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+# ATT: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5c,0xd4
-# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2
-# INTEL: vsubnepbf16 xmm2, xmm3, xmm4
+# ATT: vsubbf16 %xmm4, %xmm3, %xmm2
+# INTEL: vsubbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5c,0xd4
-# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
-# INTEL: vsubnepbf16 xmm2 {k7}, xmm3, xmm4
+# ATT: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7}
+# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5c,0xd4
-# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+# ATT: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5c,0xd4
-# ATT: vsubnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-# INTEL: vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+# ATT: vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-# INTEL: vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+# ATT: vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2
-# INTEL: vsubnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+# ATT: vsubbf16 (%eax){1to32}, %zmm3, %zmm2
+# INTEL: vsubbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5c,0x10
-# ATT: vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
-# INTEL: vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+# ATT: vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2
+# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+# ATT: vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f
-# ATT: vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+# ATT: vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80
-# ATT: vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-# INTEL: vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+# ATT: vsubbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-# INTEL: vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+# ATT: vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2
-# INTEL: vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+# ATT: vsubbf16 (%eax){1to16}, %ymm3, %ymm2
+# INTEL: vsubbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5c,0x10
-# ATT: vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
-# INTEL: vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+# ATT: vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2
+# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+# ATT: vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f
-# ATT: vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+# ATT: vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80
-# ATT: vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-# INTEL: vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+# ATT: vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-# INTEL: vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+# ATT: vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%eax){1to8}, %xmm3, %xmm2
-# INTEL: vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+# ATT: vsubbf16 (%eax){1to8}, %xmm3, %xmm2
+# INTEL: vsubbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5c,0x10
-# ATT: vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2
-# INTEL: vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+# ATT: vsubbf16 -512(,%ebp,2), %xmm3, %xmm2
+# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+# ATT: vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f
-# ATT: vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+# ATT: vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80
diff --git a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt
index 953ef8dd8a14c9..ff321ed3488c76 100644
--- a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt
+++ b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt
@@ -1,208 +1,208 @@
# RUN: llvm-mc --disassemble %s -triple=x86_64 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=x86_64 --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL
-# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vaddnepbf16 ymm22, ymm23, ymm24
+# ATT: vaddbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vaddbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x58,0xf0
-# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vaddnepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vaddbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x58,0xf0
-# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x58,0xf0
-# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vaddnepbf16 zmm22, zmm23, zmm24
+# ATT: vaddbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vaddbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x58,0xf0
-# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vaddnepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vaddbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x58,0xf0
-# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x58,0xf0
-# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vaddnepbf16 xmm22, xmm23, xmm24
+# ATT: vaddbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vaddbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x58,0xf0
-# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vaddnepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vaddbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x58,0xf0
-# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x58,0xf0
-# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vaddbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vaddbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vaddbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00
-# ATT: vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f
-# ATT: vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x58,0x72,0x80
-# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vaddbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vaddbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00
-# ATT: vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vaddbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f
-# ATT: vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x58,0x72,0x80
-# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vaddbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vaddbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00
-# ATT: vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vaddbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x58,0x71,0x7f
-# ATT: vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x58,0x72,0x80
-# ATT: vcmppbf16 $123, %ymm24, %ymm23, %k5
-# INTEL: vcmppbf16 k5, ymm23, ymm24, 123
+# ATT: vcmpbf16 $123, %ymm24, %ymm23, %k5
+# INTEL: vcmpbf16 k5, ymm23, ymm24, 123
0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm23, ymm24, 123
+# ATT: vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm23, ymm24, 123
0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, %xmm24, %xmm23, %k5
-# INTEL: vcmppbf16 k5, xmm23, xmm24, 123
+# ATT: vcmpbf16 $123, %xmm24, %xmm23, %k5
+# INTEL: vcmpbf16 k5, xmm23, xmm24, 123
0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm23, xmm24, 123
+# ATT: vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm23, xmm24, 123
0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, %zmm24, %zmm23, %k5
-# INTEL: vcmppbf16 k5, zmm23, zmm24, 123
+# ATT: vcmpbf16 $123, %zmm24, %zmm23, %k5
+# INTEL: vcmpbf16 k5, zmm23, zmm24, 123
0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm23, zmm24, 123
+# ATT: vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm23, zmm24, 123
0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b
-# ATT: vcmppbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
-# INTEL: vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
+# INTEL: vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5
-# INTEL: vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123
+# ATT: vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5
+# INTEL: vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123
0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5
-# INTEL: vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
+# ATT: vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5
+# INTEL: vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
+# ATT: vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
+# ATT: vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b
-# ATT: vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
-# INTEL: vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
+# INTEL: vcmpbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5
-# INTEL: vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123
+# ATT: vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5
+# INTEL: vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123
0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5
-# INTEL: vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
+# ATT: vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5
+# INTEL: vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
+# ATT: vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
+# ATT: vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b
-# ATT: vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
-# INTEL: vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
+# INTEL: vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
+# ATT: vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, (%rip){1to16}, %ymm23, %k5
-# INTEL: vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123
+# ATT: vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5
+# INTEL: vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123
0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5
-# INTEL: vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
+# ATT: vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5
+# INTEL: vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
+# ATT: vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b
-# ATT: vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
-# INTEL: vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
+# ATT: vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
+# INTEL: vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b
# ATT: vcomsbf16 %xmm23, %xmm22
@@ -233,2783 +233,2783 @@
# INTEL: vcomsbf16 xmm22, word ptr [rdx - 256]
0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80
-# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vdivnepbf16 ymm22, ymm23, ymm24
+# ATT: vdivbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vdivbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x5e,0xf0
-# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vdivnepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vdivbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x5e,0xf0
-# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x5e,0xf0
-# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vdivnepbf16 zmm22, zmm23, zmm24
+# ATT: vdivbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vdivbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x5e,0xf0
-# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vdivnepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vdivbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x5e,0xf0
-# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x5e,0xf0
-# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vdivnepbf16 xmm22, xmm23, xmm24
+# ATT: vdivbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vdivbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x5e,0xf0
-# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vdivnepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vdivbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x5e,0xf0
-# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x5e,0xf0
-# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vdivbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vdivbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00
-# ATT: vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f
-# ATT: vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80
-# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vdivbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vdivbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00
-# ATT: vdivnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f
-# ATT: vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80
-# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vdivbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vdivbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00
-# ATT: vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vdivbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vdivbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f
-# ATT: vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x5e,0x72,0x80
-# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmadd132bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0x98,0xf0
-# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd132bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0x98,0xf0
-# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0x98,0xf0
-# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmadd132bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0x98,0xf0
-# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd132bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0x98,0xf0
-# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0x98,0xf0
-# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmadd132bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0x98,0xf0
-# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd132bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0x98,0xf0
-# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0x98,0xf0
-# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f
-# ATT: vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0x98,0x72,0x80
-# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f
-# ATT: vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0x98,0x72,0x80
-# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0x98,0x71,0x7f
-# ATT: vfmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0x98,0x72,0x80
-# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmadd213bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd213bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmadd213bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd213bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmadd213bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd213bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xa8,0xf0
-# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xa8,0xf0
-# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f
-# ATT: vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80
-# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f
-# ATT: vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80
-# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f
-# ATT: vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xa8,0x72,0x80
-# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmadd231bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd231bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmadd231bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd231bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmadd231bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd231bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xb8,0xf0
-# ATT: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xb8,0xf0
-# ATT: vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f
-# ATT: vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80
-# ATT: vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f
-# ATT: vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80
-# ATT: vfmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f
-# ATT: vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xb8,0x72,0x80
-# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmsub132bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub132bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmsub132bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub132bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmsub132bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub132bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0x9a,0xf0
-# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0x9a,0xf0
-# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f
-# ATT: vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80
-# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f
-# ATT: vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80
-# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f
-# ATT: vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0x9a,0x72,0x80
-# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmsub213bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub213bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmsub213bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub213bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmsub213bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub213bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xaa,0xf0
-# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xaa,0xf0
-# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f
-# ATT: vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80
-# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f
-# ATT: vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80
-# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f
-# ATT: vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xaa,0x72,0x80
-# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymm24
+# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfmsub231bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xba,0xf0
-# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub231bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xba,0xf0
-# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xba,0xf0
-# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmm24
+# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfmsub231bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xba,0xf0
-# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub231bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xba,0xf0
-# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xba,0xf0
-# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmm24
+# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfmsub231bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xba,0xf0
-# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub231bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xba,0xf0
-# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xba,0xf0
-# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f
-# ATT: vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xba,0x72,0x80
-# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f
-# ATT: vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xba,0x72,0x80
-# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00
-# ATT: vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xba,0x71,0x7f
-# ATT: vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xba,0x72,0x80
-# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmadd132bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmadd132bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmadd132bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0x9c,0xf0
-# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f
-# ATT: vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80
-# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f
-# ATT: vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80
-# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f
-# ATT: vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0x9c,0x72,0x80
-# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmadd213bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmadd213bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd213bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmadd213bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xac,0xf0
-# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xac,0xf0
-# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f
-# ATT: vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xac,0x72,0x80
-# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f
-# ATT: vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xac,0x72,0x80
-# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xac,0x71,0x7f
-# ATT: vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xac,0x72,0x80
-# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmadd231bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmadd231bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmadd231bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmadd231bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xbc,0xf0
-# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f
-# ATT: vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80
-# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f
-# ATT: vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80
-# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f
-# ATT: vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xbc,0x72,0x80
-# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmsub132bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmsub132bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmsub132nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmsub132bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0x9e,0xf0
-# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f
-# ATT: vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80
-# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f
-# ATT: vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80
-# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f
-# ATT: vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0x9e,0x72,0x80
-# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmsub213bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmsub213bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmsub213bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xae,0xf0
-# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xae,0xf0
-# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f
-# ATT: vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xae,0x72,0x80
-# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f
-# ATT: vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xae,0x72,0x80
-# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xae,0x71,0x7f
-# ATT: vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xae,0x72,0x80
-# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymm24
+# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22
+# INTEL: vfnmsub231bf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmm24
+# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22
+# INTEL: vfnmsub231bf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmm24
+# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22
+# INTEL: vfnmsub231bf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0xbe,0xf0
-# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vfnmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f
-# ATT: vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80
-# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f
-# ATT: vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vfnmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80
-# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00
-# ATT: vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vfnmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f
-# ATT: vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0xbe,0x72,0x80
-# ATT: vfpclasspbf16 $123, %zmm23, %k5
-# INTEL: vfpclasspbf16 k5, zmm23, 123
+# ATT: vfpclassbf16 $123, %zmm23, %k5
+# INTEL: vfpclassbf16 k5, zmm23, 123
0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b
-# ATT: vfpclasspbf16 $123, %zmm23, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, zmm23, 123
+# ATT: vfpclassbf16 $123, %zmm23, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, zmm23, 123
0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b
-# ATT: vfpclasspbf16 $123, %ymm23, %k5
-# INTEL: vfpclasspbf16 k5, ymm23, 123
+# ATT: vfpclassbf16 $123, %ymm23, %k5
+# INTEL: vfpclassbf16 k5, ymm23, 123
0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b
-# ATT: vfpclasspbf16 $123, %ymm23, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, ymm23, 123
+# ATT: vfpclassbf16 $123, %ymm23, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, ymm23, 123
0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b
-# ATT: vfpclasspbf16 $123, %xmm23, %k5
-# INTEL: vfpclasspbf16 k5, xmm23, 123
+# ATT: vfpclassbf16 $123, %xmm23, %k5
+# INTEL: vfpclassbf16 k5, xmm23, 123
0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b
-# ATT: vfpclasspbf16 $123, %xmm23, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmm23, 123
+# ATT: vfpclassbf16 $123, %xmm23, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmm23, 123
0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b
-# ATT: vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5
-# INTEL: vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5
+# INTEL: vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vfpclasspbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vfpclasspbf16 $123, (%rip){1to8}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to8}, 123
+# ATT: vfpclassbf16 $123, (%rip){1to8}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [rip]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vfpclasspbf16x $123, -512(,%rbp,2), %k5
-# INTEL: vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123
+# ATT: vfpclassbf16x $123, -512(,%rbp,2), %k5
+# INTEL: vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123
0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
+# ATT: vfpclassbf16x $123, 2032(%rcx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
+# ATT: vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b
-# ATT: vfpclasspbf16 $123, (%rip){1to16}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to16}, 123
+# ATT: vfpclassbf16 $123, (%rip){1to16}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [rip]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vfpclasspbf16y $123, -1024(,%rbp,2), %k5
-# INTEL: vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123
+# ATT: vfpclassbf16y $123, -1024(,%rbp,2), %k5
+# INTEL: vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123
0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
+# ATT: vfpclassbf16y $123, 4064(%rcx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
+# ATT: vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b
-# ATT: vfpclasspbf16 $123, (%rip){1to32}, %k5
-# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to32}, 123
+# ATT: vfpclassbf16 $123, (%rip){1to32}, %k5
+# INTEL: vfpclassbf16 k5, word ptr [rip]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b
-# ATT: vfpclasspbf16z $123, -2048(,%rbp,2), %k5
-# INTEL: vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123
+# ATT: vfpclassbf16z $123, -2048(,%rbp,2), %k5
+# INTEL: vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123
0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
+# ATT: vfpclassbf16z $123, 8128(%rcx), %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b
-# ATT: vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
-# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
+# ATT: vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
+# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b
-# ATT: vgetexppbf16 %xmm23, %xmm22
-# INTEL: vgetexppbf16 xmm22, xmm23
+# ATT: vgetexpbf16 %xmm23, %xmm22
+# INTEL: vgetexpbf16 xmm22, xmm23
0x62,0xa5,0x7d,0x08,0x42,0xf7
-# ATT: vgetexppbf16 %xmm23, %xmm22 {%k7}
-# INTEL: vgetexppbf16 xmm22 {k7}, xmm23
+# ATT: vgetexpbf16 %xmm23, %xmm22 {%k7}
+# INTEL: vgetexpbf16 xmm22 {k7}, xmm23
0x62,0xa5,0x7d,0x0f,0x42,0xf7
-# ATT: vgetexppbf16 %xmm23, %xmm22 {%k7} {z}
-# INTEL: vgetexppbf16 xmm22 {k7} {z}, xmm23
+# ATT: vgetexpbf16 %xmm23, %xmm22 {%k7} {z}
+# INTEL: vgetexpbf16 xmm22 {k7} {z}, xmm23
0x62,0xa5,0x7d,0x8f,0x42,0xf7
-# ATT: vgetexppbf16 %zmm23, %zmm22
-# INTEL: vgetexppbf16 zmm22, zmm23
+# ATT: vgetexpbf16 %zmm23, %zmm22
+# INTEL: vgetexpbf16 zmm22, zmm23
0x62,0xa5,0x7d,0x48,0x42,0xf7
-# ATT: vgetexppbf16 %zmm23, %zmm22 {%k7}
-# INTEL: vgetexppbf16 zmm22 {k7}, zmm23
+# ATT: vgetexpbf16 %zmm23, %zmm22 {%k7}
+# INTEL: vgetexpbf16 zmm22 {k7}, zmm23
0x62,0xa5,0x7d,0x4f,0x42,0xf7
-# ATT: vgetexppbf16 %zmm23, %zmm22 {%k7} {z}
-# INTEL: vgetexppbf16 zmm22 {k7} {z}, zmm23
+# ATT: vgetexpbf16 %zmm23, %zmm22 {%k7} {z}
+# INTEL: vgetexpbf16 zmm22 {k7} {z}, zmm23
0x62,0xa5,0x7d,0xcf,0x42,0xf7
-# ATT: vgetexppbf16 %ymm23, %ymm22
-# INTEL: vgetexppbf16 ymm22, ymm23
+# ATT: vgetexpbf16 %ymm23, %ymm22
+# INTEL: vgetexpbf16 ymm22, ymm23
0x62,0xa5,0x7d,0x28,0x42,0xf7
-# ATT: vgetexppbf16 %ymm23, %ymm22 {%k7}
-# INTEL: vgetexppbf16 ymm22 {k7}, ymm23
+# ATT: vgetexpbf16 %ymm23, %ymm22 {%k7}
+# INTEL: vgetexpbf16 ymm22 {k7}, ymm23
0x62,0xa5,0x7d,0x2f,0x42,0xf7
-# ATT: vgetexppbf16 %ymm23, %ymm22 {%k7} {z}
-# INTEL: vgetexppbf16 ymm22 {k7} {z}, ymm23
+# ATT: vgetexpbf16 %ymm23, %ymm22 {%k7} {z}
+# INTEL: vgetexpbf16 ymm22 {k7} {z}, ymm23
0x62,0xa5,0x7d,0xaf,0x42,0xf7
-# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%rip){1to8}, %xmm22
-# INTEL: vgetexppbf16 xmm22, word ptr [rip]{1to8}
+# ATT: vgetexpbf16 (%rip){1to8}, %xmm22
+# INTEL: vgetexpbf16 xmm22, word ptr [rip]{1to8}
0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00
-# ATT: vgetexppbf16 -512(,%rbp,2), %xmm22
-# INTEL: vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512]
+# ATT: vgetexpbf16 -512(,%rbp,2), %xmm22
+# INTEL: vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vgetexppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+# ATT: vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f
-# ATT: vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+# ATT: vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80
-# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%rip){1to16}, %ymm22
-# INTEL: vgetexppbf16 ymm22, word ptr [rip]{1to16}
+# ATT: vgetexpbf16 (%rip){1to16}, %ymm22
+# INTEL: vgetexpbf16 ymm22, word ptr [rip]{1to16}
0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00
-# ATT: vgetexppbf16 -1024(,%rbp,2), %ymm22
-# INTEL: vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+# ATT: vgetexpbf16 -1024(,%rbp,2), %ymm22
+# INTEL: vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+# ATT: vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f
-# ATT: vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+# ATT: vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vgetexpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80
-# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vgetexppbf16 (%rip){1to32}, %zmm22
-# INTEL: vgetexppbf16 zmm22, word ptr [rip]{1to32}
+# ATT: vgetexpbf16 (%rip){1to32}, %zmm22
+# INTEL: vgetexpbf16 zmm22, word ptr [rip]{1to32}
0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00
-# ATT: vgetexppbf16 -2048(,%rbp,2), %zmm22
-# INTEL: vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+# ATT: vgetexpbf16 -2048(,%rbp,2), %zmm22
+# INTEL: vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+# ATT: vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f
-# ATT: vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+# ATT: vgetexpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80
-# ATT: vgetmantpbf16 $123, %zmm23, %zmm22
-# INTEL: vgetmantpbf16 zmm22, zmm23, 123
+# ATT: vgetmantbf16 $123, %zmm23, %zmm22
+# INTEL: vgetmantbf16 zmm22, zmm23, 123
0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7}
-# INTEL: vgetmantpbf16 zmm22 {k7}, zmm23, 123
+# ATT: vgetmantbf16 $123, %zmm23, %zmm22 {%k7}
+# INTEL: vgetmantbf16 zmm22 {k7}, zmm23, 123
0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123
+# ATT: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vgetmantbf16 zmm22 {k7} {z}, zmm23, 123
0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %ymm23, %ymm22
-# INTEL: vgetmantpbf16 ymm22, ymm23, 123
+# ATT: vgetmantbf16 $123, %ymm23, %ymm22
+# INTEL: vgetmantbf16 ymm22, ymm23, 123
0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7}
-# INTEL: vgetmantpbf16 ymm22 {k7}, ymm23, 123
+# ATT: vgetmantbf16 $123, %ymm23, %ymm22 {%k7}
+# INTEL: vgetmantbf16 ymm22 {k7}, ymm23, 123
0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123
+# ATT: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vgetmantbf16 ymm22 {k7} {z}, ymm23, 123
0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %xmm23, %xmm22
-# INTEL: vgetmantpbf16 xmm22, xmm23, 123
+# ATT: vgetmantbf16 $123, %xmm23, %xmm22
+# INTEL: vgetmantbf16 xmm22, xmm23, 123
0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7}
-# INTEL: vgetmantpbf16 xmm22 {k7}, xmm23, 123
+# ATT: vgetmantbf16 $123, %xmm23, %xmm22 {%k7}
+# INTEL: vgetmantbf16 xmm22 {k7}, xmm23, 123
0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123
+# ATT: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vgetmantbf16 xmm22 {k7} {z}, xmm23, 123
0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%rip){1to8}, %xmm22
-# INTEL: vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123
+# ATT: vgetmantbf16 $123, (%rip){1to8}, %xmm22
+# INTEL: vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123
0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, -512(,%rbp,2), %xmm22
-# INTEL: vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+# ATT: vgetmantbf16 $123, -512(,%rbp,2), %xmm22
+# INTEL: vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123
0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+# ATT: vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+# ATT: vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%rip){1to16}, %ymm22
-# INTEL: vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123
+# ATT: vgetmantbf16 $123, (%rip){1to16}, %ymm22
+# INTEL: vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123
0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22
-# INTEL: vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+# ATT: vgetmantbf16 $123, -1024(,%rbp,2), %ymm22
+# INTEL: vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+# ATT: vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+# ATT: vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b
-# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, (%rip){1to32}, %zmm22
-# INTEL: vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123
+# ATT: vgetmantbf16 $123, (%rip){1to32}, %zmm22
+# INTEL: vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123
0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22
-# INTEL: vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+# ATT: vgetmantbf16 $123, -2048(,%rbp,2), %zmm22
+# INTEL: vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+# ATT: vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b
-# ATT: vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+# ATT: vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b
-# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vmaxpbf16 ymm22, ymm23, ymm24
+# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vmaxbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x5f,0xf0
-# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vmaxpbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vmaxbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x5f,0xf0
-# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x5f,0xf0
-# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vmaxpbf16 zmm22, zmm23, zmm24
+# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vmaxbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x5f,0xf0
-# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vmaxpbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vmaxbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x5f,0xf0
-# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x5f,0xf0
-# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vmaxpbf16 xmm22, xmm23, xmm24
+# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vmaxbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x5f,0xf0
-# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vmaxpbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vmaxbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x5f,0xf0
-# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x5f,0xf0
-# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vmaxbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00
-# ATT: vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f
-# ATT: vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80
-# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vmaxbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00
-# ATT: vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f
-# ATT: vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80
-# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vmaxbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00
-# ATT: vmaxpbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f
-# ATT: vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x5f,0x72,0x80
-# ATT: vminpbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vminpbf16 ymm22, ymm23, ymm24
+# ATT: vminbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vminbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x5d,0xf0
-# ATT: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vminpbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vminbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vminbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x5d,0xf0
-# ATT: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x5d,0xf0
-# ATT: vminpbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vminpbf16 zmm22, zmm23, zmm24
+# ATT: vminbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vminbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x5d,0xf0
-# ATT: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vminpbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vminbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vminbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x5d,0xf0
-# ATT: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x5d,0xf0
-# ATT: vminpbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vminpbf16 xmm22, xmm23, xmm24
+# ATT: vminbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vminbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x5d,0xf0
-# ATT: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vminpbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vminbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vminbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x5d,0xf0
-# ATT: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x5d,0xf0
-# ATT: vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vminpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vminbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vminbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00
-# ATT: vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vminbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vminpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f
-# ATT: vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80
-# ATT: vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vminpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vminbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vminbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00
-# ATT: vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vminbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f
-# ATT: vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80
-# ATT: vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vminbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vminpbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vminpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vminbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vminbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00
-# ATT: vminpbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vminbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f
-# ATT: vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x5d,0x72,0x80
-# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vmulnepbf16 ymm22, ymm23, ymm24
+# ATT: vmulbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vmulbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x59,0xf0
-# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vmulnepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vmulbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x59,0xf0
-# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x59,0xf0
-# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vmulnepbf16 zmm22, zmm23, zmm24
+# ATT: vmulbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vmulbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x59,0xf0
-# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vmulnepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vmulbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x59,0xf0
-# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x59,0xf0
-# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vmulnepbf16 xmm22, xmm23, xmm24
+# ATT: vmulbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vmulbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x59,0xf0
-# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vmulnepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vmulbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x59,0xf0
-# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x59,0xf0
-# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vmulbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vmulbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00
-# ATT: vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f
-# ATT: vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x59,0x72,0x80
-# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vmulbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vmulbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00
-# ATT: vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vmulbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f
-# ATT: vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x59,0x72,0x80
-# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vmulbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vmulbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00
-# ATT: vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vmulbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x59,0x71,0x7f
-# ATT: vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x59,0x72,0x80
-# ATT: vrcppbf16 %xmm23, %xmm22
-# INTEL: vrcppbf16 xmm22, xmm23
+# ATT: vrcpbf16 %xmm23, %xmm22
+# INTEL: vrcpbf16 xmm22, xmm23
0x62,0xa6,0x7c,0x08,0x4c,0xf7
-# ATT: vrcppbf16 %xmm23, %xmm22 {%k7}
-# INTEL: vrcppbf16 xmm22 {k7}, xmm23
+# ATT: vrcpbf16 %xmm23, %xmm22 {%k7}
+# INTEL: vrcpbf16 xmm22 {k7}, xmm23
0x62,0xa6,0x7c,0x0f,0x4c,0xf7
-# ATT: vrcppbf16 %xmm23, %xmm22 {%k7} {z}
-# INTEL: vrcppbf16 xmm22 {k7} {z}, xmm23
+# ATT: vrcpbf16 %xmm23, %xmm22 {%k7} {z}
+# INTEL: vrcpbf16 xmm22 {k7} {z}, xmm23
0x62,0xa6,0x7c,0x8f,0x4c,0xf7
-# ATT: vrcppbf16 %zmm23, %zmm22
-# INTEL: vrcppbf16 zmm22, zmm23
+# ATT: vrcpbf16 %zmm23, %zmm22
+# INTEL: vrcpbf16 zmm22, zmm23
0x62,0xa6,0x7c,0x48,0x4c,0xf7
-# ATT: vrcppbf16 %zmm23, %zmm22 {%k7}
-# INTEL: vrcppbf16 zmm22 {k7}, zmm23
+# ATT: vrcpbf16 %zmm23, %zmm22 {%k7}
+# INTEL: vrcpbf16 zmm22 {k7}, zmm23
0x62,0xa6,0x7c,0x4f,0x4c,0xf7
-# ATT: vrcppbf16 %zmm23, %zmm22 {%k7} {z}
-# INTEL: vrcppbf16 zmm22 {k7} {z}, zmm23
+# ATT: vrcpbf16 %zmm23, %zmm22 {%k7} {z}
+# INTEL: vrcpbf16 zmm22 {k7} {z}, zmm23
0x62,0xa6,0x7c,0xcf,0x4c,0xf7
-# ATT: vrcppbf16 %ymm23, %ymm22
-# INTEL: vrcppbf16 ymm22, ymm23
+# ATT: vrcpbf16 %ymm23, %ymm22
+# INTEL: vrcpbf16 ymm22, ymm23
0x62,0xa6,0x7c,0x28,0x4c,0xf7
-# ATT: vrcppbf16 %ymm23, %ymm22 {%k7}
-# INTEL: vrcppbf16 ymm22 {k7}, ymm23
+# ATT: vrcpbf16 %ymm23, %ymm22 {%k7}
+# INTEL: vrcpbf16 ymm22 {k7}, ymm23
0x62,0xa6,0x7c,0x2f,0x4c,0xf7
-# ATT: vrcppbf16 %ymm23, %ymm22 {%k7} {z}
-# INTEL: vrcppbf16 ymm22 {k7} {z}, ymm23
+# ATT: vrcpbf16 %ymm23, %ymm22 {%k7} {z}
+# INTEL: vrcpbf16 ymm22 {k7} {z}, ymm23
0x62,0xa6,0x7c,0xaf,0x4c,0xf7
-# ATT: vrcppbf16 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrcpbf16 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%rip){1to8}, %xmm22
-# INTEL: vrcppbf16 xmm22, word ptr [rip]{1to8}
+# ATT: vrcpbf16 (%rip){1to8}, %xmm22
+# INTEL: vrcpbf16 xmm22, word ptr [rip]{1to8}
0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00
-# ATT: vrcppbf16 -512(,%rbp,2), %xmm22
-# INTEL: vrcppbf16 xmm22, xmmword ptr [2*rbp - 512]
+# ATT: vrcpbf16 -512(,%rbp,2), %xmm22
+# INTEL: vrcpbf16 xmm22, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vrcppbf16 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+# ATT: vrcpbf16 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f
-# ATT: vrcppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+# ATT: vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80
-# ATT: vrcppbf16 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrcpbf16 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%rip){1to16}, %ymm22
-# INTEL: vrcppbf16 ymm22, word ptr [rip]{1to16}
+# ATT: vrcpbf16 (%rip){1to16}, %ymm22
+# INTEL: vrcpbf16 ymm22, word ptr [rip]{1to16}
0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00
-# ATT: vrcppbf16 -1024(,%rbp,2), %ymm22
-# INTEL: vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+# ATT: vrcpbf16 -1024(,%rbp,2), %ymm22
+# INTEL: vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vrcppbf16 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+# ATT: vrcpbf16 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f
-# ATT: vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+# ATT: vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80
-# ATT: vrcppbf16 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrcpbf16 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrcppbf16 (%rip){1to32}, %zmm22
-# INTEL: vrcppbf16 zmm22, word ptr [rip]{1to32}
+# ATT: vrcpbf16 (%rip){1to32}, %zmm22
+# INTEL: vrcpbf16 zmm22, word ptr [rip]{1to32}
0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00
-# ATT: vrcppbf16 -2048(,%rbp,2), %zmm22
-# INTEL: vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+# ATT: vrcpbf16 -2048(,%rbp,2), %zmm22
+# INTEL: vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vrcppbf16 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+# ATT: vrcpbf16 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f
-# ATT: vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+# ATT: vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80
-# ATT: vreducenepbf16 $123, %zmm23, %zmm22
-# INTEL: vreducenepbf16 zmm22, zmm23, 123
+# ATT: vreducebf16 $123, %zmm23, %zmm22
+# INTEL: vreducebf16 zmm22, zmm23, 123
0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %zmm23, %zmm22 {%k7}
-# INTEL: vreducenepbf16 zmm22 {k7}, zmm23, 123
+# ATT: vreducebf16 $123, %zmm23, %zmm22 {%k7}
+# INTEL: vreducebf16 zmm22 {k7}, zmm23, 123
0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vreducenepbf16 zmm22 {k7} {z}, zmm23, 123
+# ATT: vreducebf16 $123, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vreducebf16 zmm22 {k7} {z}, zmm23, 123
0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %ymm23, %ymm22
-# INTEL: vreducenepbf16 ymm22, ymm23, 123
+# ATT: vreducebf16 $123, %ymm23, %ymm22
+# INTEL: vreducebf16 ymm22, ymm23, 123
0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %ymm23, %ymm22 {%k7}
-# INTEL: vreducenepbf16 ymm22 {k7}, ymm23, 123
+# ATT: vreducebf16 $123, %ymm23, %ymm22 {%k7}
+# INTEL: vreducebf16 ymm22 {k7}, ymm23, 123
0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vreducenepbf16 ymm22 {k7} {z}, ymm23, 123
+# ATT: vreducebf16 $123, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vreducebf16 ymm22 {k7} {z}, ymm23, 123
0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %xmm23, %xmm22
-# INTEL: vreducenepbf16 xmm22, xmm23, 123
+# ATT: vreducebf16 $123, %xmm23, %xmm22
+# INTEL: vreducebf16 xmm22, xmm23, 123
0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %xmm23, %xmm22 {%k7}
-# INTEL: vreducenepbf16 xmm22 {k7}, xmm23, 123
+# ATT: vreducebf16 $123, %xmm23, %xmm22 {%k7}
+# INTEL: vreducebf16 xmm22 {k7}, xmm23, 123
0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vreducenepbf16 xmm22 {k7} {z}, xmm23, 123
+# ATT: vreducebf16 $123, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vreducebf16 xmm22 {k7} {z}, xmm23, 123
0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vreducebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%rip){1to8}, %xmm22
-# INTEL: vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123
+# ATT: vreducebf16 $123, (%rip){1to8}, %xmm22
+# INTEL: vreducebf16 xmm22, word ptr [rip]{1to8}, 123
0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, -512(,%rbp,2), %xmm22
-# INTEL: vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+# ATT: vreducebf16 $123, -512(,%rbp,2), %xmm22
+# INTEL: vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123
0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+# ATT: vreducebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+# ATT: vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+# ATT: vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%rip){1to16}, %ymm22
-# INTEL: vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123
+# ATT: vreducebf16 $123, (%rip){1to16}, %ymm22
+# INTEL: vreducebf16 ymm22, word ptr [rip]{1to16}, 123
0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, -1024(,%rbp,2), %ymm22
-# INTEL: vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+# ATT: vreducebf16 $123, -1024(,%rbp,2), %ymm22
+# INTEL: vreducebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+# ATT: vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+# ATT: vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b
-# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, (%rip){1to32}, %zmm22
-# INTEL: vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123
+# ATT: vreducebf16 $123, (%rip){1to32}, %zmm22
+# INTEL: vreducebf16 zmm22, word ptr [rip]{1to32}, 123
0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vreducenepbf16 $123, -2048(,%rbp,2), %zmm22
-# INTEL: vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+# ATT: vreducebf16 $123, -2048(,%rbp,2), %zmm22
+# INTEL: vreducebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+# ATT: vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b
-# ATT: vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+# ATT: vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vreducebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22
-# INTEL: vrndscalenepbf16 zmm22, zmm23, 123
+# ATT: vrndscalebf16 $123, %zmm23, %zmm22
+# INTEL: vrndscalebf16 zmm22, zmm23, 123
0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7}
-# INTEL: vrndscalenepbf16 zmm22 {k7}, zmm23, 123
+# ATT: vrndscalebf16 $123, %zmm23, %zmm22 {%k7}
+# INTEL: vrndscalebf16 zmm22 {k7}, zmm23, 123
0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123
+# ATT: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vrndscalebf16 zmm22 {k7} {z}, zmm23, 123
0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22
-# INTEL: vrndscalenepbf16 ymm22, ymm23, 123
+# ATT: vrndscalebf16 $123, %ymm23, %ymm22
+# INTEL: vrndscalebf16 ymm22, ymm23, 123
0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7}
-# INTEL: vrndscalenepbf16 ymm22 {k7}, ymm23, 123
+# ATT: vrndscalebf16 $123, %ymm23, %ymm22 {%k7}
+# INTEL: vrndscalebf16 ymm22 {k7}, ymm23, 123
0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123
+# ATT: vrndscalebf16 $123, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vrndscalebf16 ymm22 {k7} {z}, ymm23, 123
0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22
-# INTEL: vrndscalenepbf16 xmm22, xmm23, 123
+# ATT: vrndscalebf16 $123, %xmm23, %xmm22
+# INTEL: vrndscalebf16 xmm22, xmm23, 123
0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7}
-# INTEL: vrndscalenepbf16 xmm22 {k7}, xmm23, 123
+# ATT: vrndscalebf16 $123, %xmm23, %xmm22 {%k7}
+# INTEL: vrndscalebf16 xmm22 {k7}, xmm23, 123
0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123
+# ATT: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vrndscalebf16 xmm22 {k7} {z}, xmm23, 123
0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%rip){1to8}, %xmm22
-# INTEL: vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123
+# ATT: vrndscalebf16 $123, (%rip){1to8}, %xmm22
+# INTEL: vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123
0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22
-# INTEL: vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+# ATT: vrndscalebf16 $123, -512(,%rbp,2), %xmm22
+# INTEL: vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123
0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+# ATT: vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+# ATT: vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%rip){1to16}, %ymm22
-# INTEL: vrndscalenepbf16 ymm22, word ptr [rip]{1to16}, 123
+# ATT: vrndscalebf16 $123, (%rip){1to16}, %ymm22
+# INTEL: vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123
0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22
-# INTEL: vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+# ATT: vrndscalebf16 $123, -1024(,%rbp,2), %ymm22
+# INTEL: vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+# ATT: vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+# ATT: vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b
-# ATT: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+# ATT: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b
-# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, (%rip){1to32}, %zmm22
-# INTEL: vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123
+# ATT: vrndscalebf16 $123, (%rip){1to32}, %zmm22
+# INTEL: vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123
0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b
-# ATT: vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22
-# INTEL: vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+# ATT: vrndscalebf16 $123, -2048(,%rbp,2), %zmm22
+# INTEL: vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b
-# ATT: vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+# ATT: vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b
-# ATT: vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+# ATT: vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b
-# ATT: vrsqrtpbf16 %xmm23, %xmm22
-# INTEL: vrsqrtpbf16 xmm22, xmm23
+# ATT: vrsqrtbf16 %xmm23, %xmm22
+# INTEL: vrsqrtbf16 xmm22, xmm23
0x62,0xa6,0x7c,0x08,0x4e,0xf7
-# ATT: vrsqrtpbf16 %xmm23, %xmm22 {%k7}
-# INTEL: vrsqrtpbf16 xmm22 {k7}, xmm23
+# ATT: vrsqrtbf16 %xmm23, %xmm22 {%k7}
+# INTEL: vrsqrtbf16 xmm22 {k7}, xmm23
0x62,0xa6,0x7c,0x0f,0x4e,0xf7
-# ATT: vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, xmm23
+# ATT: vrsqrtbf16 %xmm23, %xmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm22 {k7} {z}, xmm23
0x62,0xa6,0x7c,0x8f,0x4e,0xf7
-# ATT: vrsqrtpbf16 %zmm23, %zmm22
-# INTEL: vrsqrtpbf16 zmm22, zmm23
+# ATT: vrsqrtbf16 %zmm23, %zmm22
+# INTEL: vrsqrtbf16 zmm22, zmm23
0x62,0xa6,0x7c,0x48,0x4e,0xf7
-# ATT: vrsqrtpbf16 %zmm23, %zmm22 {%k7}
-# INTEL: vrsqrtpbf16 zmm22 {k7}, zmm23
+# ATT: vrsqrtbf16 %zmm23, %zmm22 {%k7}
+# INTEL: vrsqrtbf16 zmm22 {k7}, zmm23
0x62,0xa6,0x7c,0x4f,0x4e,0xf7
-# ATT: vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, zmm23
+# ATT: vrsqrtbf16 %zmm23, %zmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm22 {k7} {z}, zmm23
0x62,0xa6,0x7c,0xcf,0x4e,0xf7
-# ATT: vrsqrtpbf16 %ymm23, %ymm22
-# INTEL: vrsqrtpbf16 ymm22, ymm23
+# ATT: vrsqrtbf16 %ymm23, %ymm22
+# INTEL: vrsqrtbf16 ymm22, ymm23
0x62,0xa6,0x7c,0x28,0x4e,0xf7
-# ATT: vrsqrtpbf16 %ymm23, %ymm22 {%k7}
-# INTEL: vrsqrtpbf16 ymm22 {k7}, ymm23
+# ATT: vrsqrtbf16 %ymm23, %ymm22 {%k7}
+# INTEL: vrsqrtbf16 ymm22 {k7}, ymm23
0x62,0xa6,0x7c,0x2f,0x4e,0xf7
-# ATT: vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, ymm23
+# ATT: vrsqrtbf16 %ymm23, %ymm22 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm22 {k7} {z}, ymm23
0x62,0xa6,0x7c,0xaf,0x4e,0xf7
-# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%rip){1to8}, %xmm22
-# INTEL: vrsqrtpbf16 xmm22, word ptr [rip]{1to8}
+# ATT: vrsqrtbf16 (%rip){1to8}, %xmm22
+# INTEL: vrsqrtbf16 xmm22, word ptr [rip]{1to8}
0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00
-# ATT: vrsqrtpbf16 -512(,%rbp,2), %xmm22
-# INTEL: vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512]
+# ATT: vrsqrtbf16 -512(,%rbp,2), %xmm22
+# INTEL: vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+# ATT: vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f
-# ATT: vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+# ATT: vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80
-# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%rip){1to16}, %ymm22
-# INTEL: vrsqrtpbf16 ymm22, word ptr [rip]{1to16}
+# ATT: vrsqrtbf16 (%rip){1to16}, %ymm22
+# INTEL: vrsqrtbf16 ymm22, word ptr [rip]{1to16}
0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00
-# ATT: vrsqrtpbf16 -1024(,%rbp,2), %ymm22
-# INTEL: vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024]
+# ATT: vrsqrtbf16 -1024(,%rbp,2), %ymm22
+# INTEL: vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+# ATT: vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f
-# ATT: vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+# ATT: vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80
-# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vrsqrtpbf16 (%rip){1to32}, %zmm22
-# INTEL: vrsqrtpbf16 zmm22, word ptr [rip]{1to32}
+# ATT: vrsqrtbf16 (%rip){1to32}, %zmm22
+# INTEL: vrsqrtbf16 zmm22, word ptr [rip]{1to32}
0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00
-# ATT: vrsqrtpbf16 -2048(,%rbp,2), %zmm22
-# INTEL: vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048]
+# ATT: vrsqrtbf16 -2048(,%rbp,2), %zmm22
+# INTEL: vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+# ATT: vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f
-# ATT: vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+# ATT: vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80
-# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vscalefpbf16 ymm22, ymm23, ymm24
+# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vscalefbf16 ymm22, ymm23, ymm24
0x62,0x86,0x44,0x20,0x2c,0xf0
-# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vscalefpbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vscalefbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x86,0x44,0x27,0x2c,0xf0
-# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x86,0x44,0xa7,0x2c,0xf0
-# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vscalefpbf16 zmm22, zmm23, zmm24
+# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vscalefbf16 zmm22, zmm23, zmm24
0x62,0x86,0x44,0x40,0x2c,0xf0
-# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vscalefpbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vscalefbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x86,0x44,0x47,0x2c,0xf0
-# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x86,0x44,0xc7,0x2c,0xf0
-# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vscalefpbf16 xmm22, xmm23, xmm24
+# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vscalefbf16 xmm22, xmm23, xmm24
0x62,0x86,0x44,0x00,0x2c,0xf0
-# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vscalefpbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vscalefbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x86,0x44,0x07,0x2c,0xf0
-# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x86,0x44,0x87,0x2c,0xf0
-# ATT: vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vscalefbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00
-# ATT: vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f
-# ATT: vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80
-# ATT: vscalefpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vscalefbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00
-# ATT: vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vscalefbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f
-# ATT: vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80
-# ATT: vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vscalefbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vscalefbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00
-# ATT: vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f
-# ATT: vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe6,0x44,0x97,0x2c,0x72,0x80
-# ATT: vsqrtnepbf16 %xmm23, %xmm22
-# INTEL: vsqrtnepbf16 xmm22, xmm23
+# ATT: vsqrtbf16 %xmm23, %xmm22
+# INTEL: vsqrtbf16 xmm22, xmm23
0x62,0xa5,0x7d,0x08,0x51,0xf7
-# ATT: vsqrtnepbf16 %xmm23, %xmm22 {%k7}
-# INTEL: vsqrtnepbf16 xmm22 {k7}, xmm23
+# ATT: vsqrtbf16 %xmm23, %xmm22 {%k7}
+# INTEL: vsqrtbf16 xmm22 {k7}, xmm23
0x62,0xa5,0x7d,0x0f,0x51,0xf7
-# ATT: vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm22 {k7} {z}, xmm23
+# ATT: vsqrtbf16 %xmm23, %xmm22 {%k7} {z}
+# INTEL: vsqrtbf16 xmm22 {k7} {z}, xmm23
0x62,0xa5,0x7d,0x8f,0x51,0xf7
-# ATT: vsqrtnepbf16 %zmm23, %zmm22
-# INTEL: vsqrtnepbf16 zmm22, zmm23
+# ATT: vsqrtbf16 %zmm23, %zmm22
+# INTEL: vsqrtbf16 zmm22, zmm23
0x62,0xa5,0x7d,0x48,0x51,0xf7
-# ATT: vsqrtnepbf16 %zmm23, %zmm22 {%k7}
-# INTEL: vsqrtnepbf16 zmm22 {k7}, zmm23
+# ATT: vsqrtbf16 %zmm23, %zmm22 {%k7}
+# INTEL: vsqrtbf16 zmm22 {k7}, zmm23
0x62,0xa5,0x7d,0x4f,0x51,0xf7
-# ATT: vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, zmm23
+# ATT: vsqrtbf16 %zmm23, %zmm22 {%k7} {z}
+# INTEL: vsqrtbf16 zmm22 {k7} {z}, zmm23
0x62,0xa5,0x7d,0xcf,0x51,0xf7
-# ATT: vsqrtnepbf16 %ymm23, %ymm22
-# INTEL: vsqrtnepbf16 ymm22, ymm23
+# ATT: vsqrtbf16 %ymm23, %ymm22
+# INTEL: vsqrtbf16 ymm22, ymm23
0x62,0xa5,0x7d,0x28,0x51,0xf7
-# ATT: vsqrtnepbf16 %ymm23, %ymm22 {%k7}
-# INTEL: vsqrtnepbf16 ymm22 {k7}, ymm23
+# ATT: vsqrtbf16 %ymm23, %ymm22 {%k7}
+# INTEL: vsqrtbf16 ymm22 {k7}, ymm23
0x62,0xa5,0x7d,0x2f,0x51,0xf7
-# ATT: vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, ymm23
+# ATT: vsqrtbf16 %ymm23, %ymm22 {%k7} {z}
+# INTEL: vsqrtbf16 ymm22 {k7} {z}, ymm23
0x62,0xa5,0x7d,0xaf,0x51,0xf7
-# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22
-# INTEL: vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %xmm22
+# INTEL: vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7}
-# INTEL: vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
+# INTEL: vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%rip){1to8}, %xmm22
-# INTEL: vsqrtnepbf16 xmm22, word ptr [rip]{1to8}
+# ATT: vsqrtbf16 (%rip){1to8}, %xmm22
+# INTEL: vsqrtbf16 xmm22, word ptr [rip]{1to8}
0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00
-# ATT: vsqrtnepbf16 -512(,%rbp,2), %xmm22
-# INTEL: vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512]
+# ATT: vsqrtbf16 -512(,%rbp,2), %xmm22
+# INTEL: vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+# ATT: vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
+# INTEL: vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f
-# ATT: vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+# ATT: vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+# INTEL: vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80
-# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22
-# INTEL: vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %ymm22
+# INTEL: vsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7}
-# INTEL: vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
+# INTEL: vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%rip){1to16}, %ymm22
-# INTEL: vsqrtnepbf16 ymm22, word ptr [rip]{1to16}
+# ATT: vsqrtbf16 (%rip){1to16}, %ymm22
+# INTEL: vsqrtbf16 ymm22, word ptr [rip]{1to16}
0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00
-# ATT: vsqrtnepbf16 -1024(,%rbp,2), %ymm22
-# INTEL: vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024]
+# ATT: vsqrtbf16 -1024(,%rbp,2), %ymm22
+# INTEL: vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+# ATT: vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
+# INTEL: vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f
-# ATT: vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+# ATT: vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+# INTEL: vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80
-# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22
-# INTEL: vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %zmm22
+# INTEL: vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7}
-# INTEL: vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
+# INTEL: vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsqrtnepbf16 (%rip){1to32}, %zmm22
-# INTEL: vsqrtnepbf16 zmm22, word ptr [rip]{1to32}
+# ATT: vsqrtbf16 (%rip){1to32}, %zmm22
+# INTEL: vsqrtbf16 zmm22, word ptr [rip]{1to32}
0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00
-# ATT: vsqrtnepbf16 -2048(,%rbp,2), %zmm22
-# INTEL: vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048]
+# ATT: vsqrtbf16 -2048(,%rbp,2), %zmm22
+# INTEL: vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+# ATT: vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
+# INTEL: vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f
-# ATT: vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+# ATT: vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+# INTEL: vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80
-# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22
-# INTEL: vsubnepbf16 ymm22, ymm23, ymm24
+# ATT: vsubbf16 %ymm24, %ymm23, %ymm22
+# INTEL: vsubbf16 ymm22, ymm23, ymm24
0x62,0x85,0x45,0x20,0x5c,0xf0
-# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
-# INTEL: vsubnepbf16 ymm22 {k7}, ymm23, ymm24
+# ATT: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7}
+# INTEL: vsubbf16 ymm22 {k7}, ymm23, ymm24
0x62,0x85,0x45,0x27,0x5c,0xf0
-# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+# ATT: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, ymm24
0x62,0x85,0x45,0xa7,0x5c,0xf0
-# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22
-# INTEL: vsubnepbf16 zmm22, zmm23, zmm24
+# ATT: vsubbf16 %zmm24, %zmm23, %zmm22
+# INTEL: vsubbf16 zmm22, zmm23, zmm24
0x62,0x85,0x45,0x40,0x5c,0xf0
-# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
-# INTEL: vsubnepbf16 zmm22 {k7}, zmm23, zmm24
+# ATT: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7}
+# INTEL: vsubbf16 zmm22 {k7}, zmm23, zmm24
0x62,0x85,0x45,0x47,0x5c,0xf0
-# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+# ATT: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, zmm24
0x62,0x85,0x45,0xc7,0x5c,0xf0
-# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22
-# INTEL: vsubnepbf16 xmm22, xmm23, xmm24
+# ATT: vsubbf16 %xmm24, %xmm23, %xmm22
+# INTEL: vsubbf16 xmm22, xmm23, xmm24
0x62,0x85,0x45,0x00,0x5c,0xf0
-# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
-# INTEL: vsubnepbf16 xmm22 {k7}, xmm23, xmm24
+# ATT: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7}
+# INTEL: vsubbf16 xmm22 {k7}, xmm23, xmm24
0x62,0x85,0x45,0x07,0x5c,0xf0
-# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+# ATT: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, xmm24
0x62,0x85,0x45,0x87,0x5c,0xf0
-# ATT: vsubnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-# INTEL: vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+# INTEL: vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-# INTEL: vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+# ATT: vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+# INTEL: vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22
-# INTEL: vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+# ATT: vsubbf16 (%rip){1to32}, %zmm23, %zmm22
+# INTEL: vsubbf16 zmm22, zmm23, word ptr [rip]{1to32}
0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00
-# ATT: vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
-# INTEL: vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+# ATT: vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22
+# INTEL: vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff
-# ATT: vsubnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+# ATT: vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f
-# ATT: vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+# ATT: vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80
-# ATT: vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-# INTEL: vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+# INTEL: vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-# INTEL: vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+# ATT: vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+# INTEL: vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22
-# INTEL: vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+# ATT: vsubbf16 (%rip){1to16}, %ymm23, %ymm22
+# INTEL: vsubbf16 ymm22, ymm23, word ptr [rip]{1to16}
0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00
-# ATT: vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
-# INTEL: vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+# ATT: vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22
+# INTEL: vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff
-# ATT: vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+# ATT: vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f
-# ATT: vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+# ATT: vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80
-# ATT: vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-# INTEL: vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+# ATT: vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+# INTEL: vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10
-# ATT: vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-# INTEL: vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+# ATT: vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+# INTEL: vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00
-# ATT: vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22
-# INTEL: vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+# ATT: vsubbf16 (%rip){1to8}, %xmm23, %xmm22
+# INTEL: vsubbf16 xmm22, xmm23, word ptr [rip]{1to8}
0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00
-# ATT: vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22
-# INTEL: vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+# ATT: vsubbf16 -512(,%rbp,2), %xmm23, %xmm22
+# INTEL: vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff
-# ATT: vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+# ATT: vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f
-# ATT: vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+# ATT: vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
0x62,0xe5,0x45,0x97,0x5c,0x72,0x80
diff --git a/llvm/test/MC/X86/avx10.2-bf16-32-att.s b/llvm/test/MC/X86/avx10.2-bf16-32-att.s
index 9f62743177c9bd..6b4f23c1ec01dd 100644
--- a/llvm/test/MC/X86/avx10.2-bf16-32-att.s
+++ b/llvm/test/MC/X86/avx10.2-bf16-32-att.s
@@ -1,208 +1,208 @@
// RUN: llvm-mc -triple i386 --show-encoding %s | FileCheck %s
-// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0xd4]
- vaddnepbf16 %ymm4, %ymm3, %ymm2
+ vaddbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0xd4]
- vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vaddbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0xd4]
- vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0xd4]
- vaddnepbf16 %zmm4, %zmm3, %zmm2
+ vaddbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0xd4]
- vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vaddbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0xd4]
- vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0xd4]
- vaddnepbf16 %xmm4, %xmm3, %xmm2
+ vaddbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0xd4]
- vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vaddbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0xd4]
- vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vaddbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x58,0x10]
- vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vaddbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f]
- vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x58,0x52,0x80]
- vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vaddbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x58,0x10]
- vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vaddbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f]
- vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x58,0x52,0x80]
- vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vaddnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vaddbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x58,0x10]
- vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vaddbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vaddbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vaddbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vaddbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f]
- vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vaddbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x58,0x52,0x80]
- vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vcmppbf16 $123, %ymm4, %ymm3, %k5
+// CHECK: vcmpbf16 $123, %ymm4, %ymm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b]
- vcmppbf16 $123, %ymm4, %ymm3, %k5
+ vcmpbf16 $123, %ymm4, %ymm3, %k5
-// CHECK: vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b]
- vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7}
+ vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, %xmm4, %xmm3, %k5
+// CHECK: vcmpbf16 $123, %xmm4, %xmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b]
- vcmppbf16 $123, %xmm4, %xmm3, %k5
+ vcmpbf16 $123, %xmm4, %xmm3, %k5
-// CHECK: vcmppbf16 $123, %xmm4, %xmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b]
- vcmppbf16 $123, %xmm4, %xmm3, %k5 {%k7}
+ vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, %zmm4, %zmm3, %k5
+// CHECK: vcmpbf16 $123, %zmm4, %zmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b]
- vcmppbf16 $123, %zmm4, %zmm3, %k5
+ vcmpbf16 $123, %zmm4, %zmm3, %k5
-// CHECK: vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b]
- vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7}
+ vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
+// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
+ vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5
-// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
+ vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5
+// CHECK: vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b]
- vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5
+ vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5
-// CHECK: vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5
+// CHECK: vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5
+ vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5
-// CHECK: vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
+ vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
+ vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
+// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
+ vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5
-// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
+ vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5
+// CHECK: vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b]
- vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5
+ vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5
-// CHECK: vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5
+// CHECK: vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5
+ vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5
-// CHECK: vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
+ vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
+ vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
+// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
+ vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5
-// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
+ vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5
+// CHECK: vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b]
- vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5
+ vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5
-// CHECK: vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5
+// CHECK: vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5
+ vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5
-// CHECK: vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
+ vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
+ vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
// CHECK: vcomsbf16 %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0xd3]
@@ -232,2783 +232,2783 @@
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80]
vcomsbf16 -256(%edx), %xmm2
-// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0xd4]
- vdivnepbf16 %ymm4, %ymm3, %ymm2
+ vdivbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0xd4]
- vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vdivbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0xd4]
- vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0xd4]
- vdivnepbf16 %zmm4, %zmm3, %zmm2
+ vdivbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0xd4]
- vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vdivbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0xd4]
- vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0xd4]
- vdivnepbf16 %xmm4, %xmm3, %xmm2
+ vdivbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0xd4]
- vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vdivbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0xd4]
- vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vdivbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5e,0x10]
- vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vdivbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f]
- vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80]
- vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vdivbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5e,0x10]
- vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vdivbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f]
- vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80]
- vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vdivbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5e,0x10]
- vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vdivbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vdivnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vdivbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vdivnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vdivbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f]
- vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80]
- vdivnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0xd4]
- vfmadd132nepbf16 %ymm4, %ymm3, %ymm2
+ vfmadd132bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0xd4]
- vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0xd4]
- vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0xd4]
- vfmadd132nepbf16 %zmm4, %zmm3, %zmm2
+ vfmadd132bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0xd4]
- vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0xd4]
- vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0xd4]
- vfmadd132nepbf16 %xmm4, %xmm3, %xmm2
+ vfmadd132bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0xd4]
- vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0xd4]
- vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x98,0x10]
- vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f]
- vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x98,0x52,0x80]
- vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x98,0x10]
- vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f]
- vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x98,0x52,0x80]
- vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x98,0x10]
- vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f]
- vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x98,0x52,0x80]
- vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0xd4]
- vfmadd213nepbf16 %ymm4, %ymm3, %ymm2
+ vfmadd213bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0xd4]
- vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0xd4]
- vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0xd4]
- vfmadd213nepbf16 %zmm4, %zmm3, %zmm2
+ vfmadd213bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0xd4]
- vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0xd4]
- vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0xd4]
- vfmadd213nepbf16 %xmm4, %xmm3, %xmm2
+ vfmadd213bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0xd4]
- vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0xd4]
- vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xa8,0x10]
- vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f]
- vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80]
- vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xa8,0x10]
- vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f]
- vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80]
- vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xa8,0x10]
- vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f]
- vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80]
- vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0xd4]
- vfmadd231nepbf16 %ymm4, %ymm3, %ymm2
+ vfmadd231bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0xd4]
- vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0xd4]
- vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0xd4]
- vfmadd231nepbf16 %zmm4, %zmm3, %zmm2
+ vfmadd231bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0xd4]
- vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0xd4]
- vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0xd4]
- vfmadd231nepbf16 %xmm4, %xmm3, %xmm2
+ vfmadd231bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0xd4]
- vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0xd4]
- vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xb8,0x10]
- vfmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f]
- vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80]
- vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xb8,0x10]
- vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f]
- vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80]
- vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xb8,0x10]
- vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f]
- vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80]
- vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0xd4]
- vfmsub132nepbf16 %ymm4, %ymm3, %ymm2
+ vfmsub132bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0xd4]
- vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0xd4]
- vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0xd4]
- vfmsub132nepbf16 %zmm4, %zmm3, %zmm2
+ vfmsub132bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0xd4]
- vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0xd4]
- vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0xd4]
- vfmsub132nepbf16 %xmm4, %xmm3, %xmm2
+ vfmsub132bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0xd4]
- vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0xd4]
- vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9a,0x10]
- vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f]
- vfmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80]
- vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9a,0x10]
- vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f]
- vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80]
- vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9a,0x10]
- vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f]
- vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80]
- vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0xd4]
- vfmsub213nepbf16 %ymm4, %ymm3, %ymm2
+ vfmsub213bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0xd4]
- vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0xd4]
- vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0xd4]
- vfmsub213nepbf16 %zmm4, %zmm3, %zmm2
+ vfmsub213bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0xd4]
- vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0xd4]
- vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0xd4]
- vfmsub213nepbf16 %xmm4, %xmm3, %xmm2
+ vfmsub213bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0xd4]
- vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0xd4]
- vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xaa,0x10]
- vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f]
- vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80]
- vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xaa,0x10]
- vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f]
- vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80]
- vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xaa,0x10]
- vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f]
- vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80]
- vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0xd4]
- vfmsub231nepbf16 %ymm4, %ymm3, %ymm2
+ vfmsub231bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0xd4]
- vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0xd4]
- vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0xd4]
- vfmsub231nepbf16 %zmm4, %zmm3, %zmm2
+ vfmsub231bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0xd4]
- vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0xd4]
- vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0xd4]
- vfmsub231nepbf16 %xmm4, %xmm3, %xmm2
+ vfmsub231bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0xd4]
- vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0xd4]
- vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xba,0x10]
- vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f]
- vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xba,0x52,0x80]
- vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xba,0x10]
- vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f]
- vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xba,0x52,0x80]
- vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xba,0x10]
- vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f]
- vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xba,0x52,0x80]
- vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0xd4]
- vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmadd132bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0xd4]
- vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0xd4]
- vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0xd4]
- vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmadd132bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0xd4]
- vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0xd4]
- vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0xd4]
- vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmadd132bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0xd4]
- vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0xd4]
- vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9c,0x10]
- vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80]
- vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9c,0x10]
- vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80]
- vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9c,0x10]
- vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80]
- vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0xd4]
- vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmadd213bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0xd4]
- vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0xd4]
- vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0xd4]
- vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmadd213bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0xd4]
- vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0xd4]
- vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0xd4]
- vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmadd213bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0xd4]
- vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0xd4]
- vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xac,0x10]
- vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f]
- vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xac,0x52,0x80]
- vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xac,0x10]
- vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f]
- vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xac,0x52,0x80]
- vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xac,0x10]
- vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f]
- vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xac,0x52,0x80]
- vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmadd231bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0xd4]
- vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmadd231bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0xd4]
- vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0xd4]
- vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0xd4]
- vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmadd231bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0xd4]
- vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0xd4]
- vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0xd4]
- vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmadd231bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0xd4]
- vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0xd4]
- vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbc,0x10]
- vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80]
- vfnmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbc,0x10]
- vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80]
- vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbc,0x10]
- vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80]
- vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0xd4]
- vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmsub132bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0xd4]
- vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0xd4]
- vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0xd4]
- vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmsub132bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0xd4]
- vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0xd4]
- vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0xd4]
- vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmsub132bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0xd4]
- vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0xd4]
- vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9e,0x10]
- vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80]
- vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9e,0x10]
- vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80]
- vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9e,0x10]
- vfnmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80]
- vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0xd4]
- vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmsub213bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0xd4]
- vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0xd4]
- vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0xd4]
- vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmsub213bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0xd4]
- vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0xd4]
- vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0xd4]
- vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmsub213bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0xd4]
- vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0xd4]
- vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xae,0x10]
- vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f]
- vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xae,0x52,0x80]
- vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xae,0x10]
- vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f]
- vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xae,0x52,0x80]
- vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xae,0x10]
- vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f]
- vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xae,0x52,0x80]
- vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0xd4]
- vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2
+ vfnmsub231bf16 %ymm4, %ymm3, %ymm2
-// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0xd4]
- vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0xd4]
- vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0xd4]
- vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2
+ vfnmsub231bf16 %zmm4, %zmm3, %zmm2
-// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0xd4]
- vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0xd4]
- vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0xd4]
- vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2
+ vfnmsub231bf16 %xmm4, %xmm3, %xmm2
-// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0xd4]
- vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0xd4]
- vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbe,0x10]
- vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80]
- vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbe,0x10]
- vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80]
- vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbe,0x10]
- vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80]
- vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vfpclasspbf16 $123, %zmm3, %k5
+// CHECK: vfpclassbf16 $123, %zmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %zmm3, %k5
+ vfpclassbf16 $123, %zmm3, %k5
-// CHECK: vfpclasspbf16 $123, %zmm3, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %zmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %zmm3, %k5 {%k7}
+ vfpclassbf16 $123, %zmm3, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, %ymm3, %k5
+// CHECK: vfpclassbf16 $123, %ymm3, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %ymm3, %k5
+ vfpclassbf16 $123, %ymm3, %k5
-// CHECK: vfpclasspbf16 $123, %ymm3, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %ymm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %ymm3, %k5 {%k7}
+ vfpclassbf16 $123, %ymm3, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, %xmm3, %k5
+// CHECK: vfpclassbf16 $123, %xmm3, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %xmm3, %k5
+ vfpclassbf16 $123, %xmm3, %k5
-// CHECK: vfpclasspbf16 $123, %xmm3, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %xmm3, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b]
- vfpclasspbf16 $123, %xmm3, %k5 {%k7}
+ vfpclassbf16 $123, %xmm3, %k5 {%k7}
-// CHECK: vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5
+// CHECK: vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5
+ vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5
-// CHECK: vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
+// CHECK: vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
+ vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%eax){1to8}, %k5
+// CHECK: vfpclassbf16 $123, (%eax){1to8}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b]
- vfpclasspbf16 $123, (%eax){1to8}, %k5
+ vfpclassbf16 $123, (%eax){1to8}, %k5
-// CHECK: vfpclasspbf16x $123, -512(,%ebp,2), %k5
+// CHECK: vfpclassbf16x $123, -512(,%ebp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vfpclasspbf16x $123, -512(,%ebp,2), %k5
+ vfpclassbf16x $123, -512(,%ebp,2), %k5
-// CHECK: vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7}
+// CHECK: vfpclassbf16x $123, 2032(%ecx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7}
+ vfpclassbf16x $123, 2032(%ecx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%eax){1to16}, %k5
+// CHECK: vfpclassbf16 $123, (%eax){1to16}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b]
- vfpclasspbf16 $123, (%eax){1to16}, %k5
+ vfpclassbf16 $123, (%eax){1to16}, %k5
-// CHECK: vfpclasspbf16y $123, -1024(,%ebp,2), %k5
+// CHECK: vfpclassbf16y $123, -1024(,%ebp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vfpclasspbf16y $123, -1024(,%ebp,2), %k5
+ vfpclassbf16y $123, -1024(,%ebp,2), %k5
-// CHECK: vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7}
+// CHECK: vfpclassbf16y $123, 4064(%ecx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7}
+ vfpclassbf16y $123, 4064(%ecx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%edx){1to16}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%edx){1to16}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%eax){1to32}, %k5
+// CHECK: vfpclassbf16 $123, (%eax){1to32}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b]
- vfpclasspbf16 $123, (%eax){1to32}, %k5
+ vfpclassbf16 $123, (%eax){1to32}, %k5
-// CHECK: vfpclasspbf16z $123, -2048(,%ebp,2), %k5
+// CHECK: vfpclassbf16z $123, -2048(,%ebp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vfpclasspbf16z $123, -2048(,%ebp,2), %k5
+ vfpclassbf16z $123, -2048(,%ebp,2), %k5
-// CHECK: vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7}
+// CHECK: vfpclassbf16z $123, 8128(%ecx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7}
+ vfpclassbf16z $123, 8128(%ecx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7}
-// CHECK: vgetexppbf16 %xmm3, %xmm2
+// CHECK: vgetexpbf16 %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0xd3]
- vgetexppbf16 %xmm3, %xmm2
+ vgetexpbf16 %xmm3, %xmm2
-// CHECK: vgetexppbf16 %xmm3, %xmm2 {%k7}
+// CHECK: vgetexpbf16 %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0xd3]
- vgetexppbf16 %xmm3, %xmm2 {%k7}
+ vgetexpbf16 %xmm3, %xmm2 {%k7}
-// CHECK: vgetexppbf16 %xmm3, %xmm2 {%k7} {z}
+// CHECK: vgetexpbf16 %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0xd3]
- vgetexppbf16 %xmm3, %xmm2 {%k7} {z}
+ vgetexpbf16 %xmm3, %xmm2 {%k7} {z}
-// CHECK: vgetexppbf16 %zmm3, %zmm2
+// CHECK: vgetexpbf16 %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0xd3]
- vgetexppbf16 %zmm3, %zmm2
+ vgetexpbf16 %zmm3, %zmm2
-// CHECK: vgetexppbf16 %zmm3, %zmm2 {%k7}
+// CHECK: vgetexpbf16 %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0xd3]
- vgetexppbf16 %zmm3, %zmm2 {%k7}
+ vgetexpbf16 %zmm3, %zmm2 {%k7}
-// CHECK: vgetexppbf16 %zmm3, %zmm2 {%k7} {z}
+// CHECK: vgetexpbf16 %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0xd3]
- vgetexppbf16 %zmm3, %zmm2 {%k7} {z}
+ vgetexpbf16 %zmm3, %zmm2 {%k7} {z}
-// CHECK: vgetexppbf16 %ymm3, %ymm2
+// CHECK: vgetexpbf16 %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0xd3]
- vgetexppbf16 %ymm3, %ymm2
+ vgetexpbf16 %ymm3, %ymm2
-// CHECK: vgetexppbf16 %ymm3, %ymm2 {%k7}
+// CHECK: vgetexpbf16 %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0xd3]
- vgetexppbf16 %ymm3, %ymm2 {%k7}
+ vgetexpbf16 %ymm3, %ymm2 {%k7}
-// CHECK: vgetexppbf16 %ymm3, %ymm2 {%k7} {z}
+// CHECK: vgetexpbf16 %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0xd3]
- vgetexppbf16 %ymm3, %ymm2 {%k7} {z}
+ vgetexpbf16 %ymm3, %ymm2 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %xmm2
+// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%esp,%esi,8), %xmm2
+ vgetexpbf16 268435456(%esp,%esi,8), %xmm2
-// CHECK: vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7}
+ vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vgetexppbf16 (%eax){1to8}, %xmm2
+// CHECK: vgetexpbf16 (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x42,0x10]
- vgetexppbf16 (%eax){1to8}, %xmm2
+ vgetexpbf16 (%eax){1to8}, %xmm2
-// CHECK: vgetexppbf16 -512(,%ebp,2), %xmm2
+// CHECK: vgetexpbf16 -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vgetexppbf16 -512(,%ebp,2), %xmm2
+ vgetexpbf16 -512(,%ebp,2), %xmm2
-// CHECK: vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f]
- vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z}
+ vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80]
- vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %ymm2
+// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%esp,%esi,8), %ymm2
+ vgetexpbf16 268435456(%esp,%esi,8), %ymm2
-// CHECK: vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7}
+ vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vgetexppbf16 (%eax){1to16}, %ymm2
+// CHECK: vgetexpbf16 (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x42,0x10]
- vgetexppbf16 (%eax){1to16}, %ymm2
+ vgetexpbf16 (%eax){1to16}, %ymm2
-// CHECK: vgetexppbf16 -1024(,%ebp,2), %ymm2
+// CHECK: vgetexpbf16 -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vgetexppbf16 -1024(,%ebp,2), %ymm2
+ vgetexpbf16 -1024(,%ebp,2), %ymm2
-// CHECK: vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f]
- vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z}
+ vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80]
- vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %zmm2
+// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%esp,%esi,8), %zmm2
+ vgetexpbf16 268435456(%esp,%esi,8), %zmm2
-// CHECK: vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7}
+ vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vgetexppbf16 (%eax){1to32}, %zmm2
+// CHECK: vgetexpbf16 (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x42,0x10]
- vgetexppbf16 (%eax){1to32}, %zmm2
+ vgetexpbf16 (%eax){1to32}, %zmm2
-// CHECK: vgetexppbf16 -2048(,%ebp,2), %zmm2
+// CHECK: vgetexpbf16 -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vgetexppbf16 -2048(,%ebp,2), %zmm2
+ vgetexpbf16 -2048(,%ebp,2), %zmm2
-// CHECK: vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f]
- vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z}
+ vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80]
- vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2
+// CHECK: vgetmantbf16 $123, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %zmm3, %zmm2
+ vgetmantbf16 $123, %zmm3, %zmm2
-// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7}
+// CHECK: vgetmantbf16 $123, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %zmm3, %zmm2 {%k7}
+ vgetmantbf16 $123, %zmm3, %zmm2 {%k7}
-// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z}
+ vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2
+// CHECK: vgetmantbf16 $123, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %ymm3, %ymm2
+ vgetmantbf16 $123, %ymm3, %ymm2
-// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7}
+// CHECK: vgetmantbf16 $123, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %ymm3, %ymm2 {%k7}
+ vgetmantbf16 $123, %ymm3, %ymm2 {%k7}
-// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z}
+ vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2
+// CHECK: vgetmantbf16 $123, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %xmm3, %xmm2
+ vgetmantbf16 $123, %xmm3, %xmm2
-// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7}
+// CHECK: vgetmantbf16 $123, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %xmm3, %xmm2 {%k7}
+ vgetmantbf16 $123, %xmm3, %xmm2 {%k7}
-// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b]
- vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z}
+ vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2
+// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2
+ vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2
-// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+ vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vgetmantpbf16 $123, (%eax){1to8}, %xmm2
+// CHECK: vgetmantbf16 $123, (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b]
- vgetmantpbf16 $123, (%eax){1to8}, %xmm2
+ vgetmantbf16 $123, (%eax){1to8}, %xmm2
-// CHECK: vgetmantpbf16 $123, -512(,%ebp,2), %xmm2
+// CHECK: vgetmantbf16 $123, -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -512(,%ebp,2), %xmm2
+ vgetmantbf16 $123, -512(,%ebp,2), %xmm2
-// CHECK: vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+ vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2
+// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2
+ vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2
-// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+ vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vgetmantpbf16 $123, (%eax){1to16}, %ymm2
+// CHECK: vgetmantbf16 $123, (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b]
- vgetmantpbf16 $123, (%eax){1to16}, %ymm2
+ vgetmantbf16 $123, (%eax){1to16}, %ymm2
-// CHECK: vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2
+// CHECK: vgetmantbf16 $123, -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2
+ vgetmantbf16 $123, -1024(,%ebp,2), %ymm2
-// CHECK: vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+ vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2
+// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2
+ vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2
-// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+ vgetmantbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vgetmantpbf16 $123, (%eax){1to32}, %zmm2
+// CHECK: vgetmantbf16 $123, (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b]
- vgetmantpbf16 $123, (%eax){1to32}, %zmm2
+ vgetmantbf16 $123, (%eax){1to32}, %zmm2
-// CHECK: vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2
+// CHECK: vgetmantbf16 $123, -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2
+ vgetmantbf16 $123, -2048(,%ebp,2), %zmm2
-// CHECK: vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+ vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0xd4]
- vmaxpbf16 %ymm4, %ymm3, %ymm2
+ vmaxbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0xd4]
- vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0xd4]
- vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0xd4]
- vmaxpbf16 %zmm4, %zmm3, %zmm2
+ vmaxbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0xd4]
- vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0xd4]
- vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0xd4]
- vmaxpbf16 %xmm4, %xmm3, %xmm2
+ vmaxbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0xd4]
- vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0xd4]
- vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vmaxbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5f,0x10]
- vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2
+ vmaxbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vmaxbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vmaxbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f]
- vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80]
- vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vmaxbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5f,0x10]
- vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2
+ vmaxbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f]
- vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmaxbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80]
- vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vmaxbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vmaxbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5f,0x10]
- vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2
+ vmaxbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f]
- vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80]
- vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vminbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0xd4]
- vminpbf16 %ymm4, %ymm3, %ymm2
+ vminbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vminbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0xd4]
- vminpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vminbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0xd4]
- vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vminbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0xd4]
- vminpbf16 %zmm4, %zmm3, %zmm2
+ vminbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vminbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0xd4]
- vminpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vminbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0xd4]
- vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vminbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0xd4]
- vminpbf16 %xmm4, %xmm3, %xmm2
+ vminbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vminbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0xd4]
- vminpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vminbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0xd4]
- vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vminpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vminpbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vminbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5d,0x10]
- vminpbf16 (%eax){1to32}, %zmm3, %zmm2
+ vminbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vminbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vminbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f]
- vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80]
- vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vminpbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vminbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5d,0x10]
- vminpbf16 (%eax){1to16}, %ymm3, %ymm2
+ vminbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vminbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vminbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f]
- vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80]
- vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vminpbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vminbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5d,0x10]
- vminpbf16 (%eax){1to8}, %xmm3, %xmm2
+ vminbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vminpbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vminbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vminpbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vminbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f]
- vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80]
- vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0xd4]
- vmulnepbf16 %ymm4, %ymm3, %ymm2
+ vmulbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0xd4]
- vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vmulbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0xd4]
- vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0xd4]
- vmulnepbf16 %zmm4, %zmm3, %zmm2
+ vmulbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0xd4]
- vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vmulbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0xd4]
- vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vmulbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0xd4]
- vmulnepbf16 %xmm4, %xmm3, %xmm2
+ vmulbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0xd4]
- vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vmulbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0xd4]
- vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vmulbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x59,0x10]
- vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vmulbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f]
- vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x59,0x52,0x80]
- vmulnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vmulbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x59,0x10]
- vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vmulbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f]
- vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x59,0x52,0x80]
- vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vmulbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vmulbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vmulbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x59,0x10]
- vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vmulbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vmulbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vmulbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f]
- vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x59,0x52,0x80]
- vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vrcppbf16 %xmm3, %xmm2
+// CHECK: vrcpbf16 %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0xd3]
- vrcppbf16 %xmm3, %xmm2
+ vrcpbf16 %xmm3, %xmm2
-// CHECK: vrcppbf16 %xmm3, %xmm2 {%k7}
+// CHECK: vrcpbf16 %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0xd3]
- vrcppbf16 %xmm3, %xmm2 {%k7}
+ vrcpbf16 %xmm3, %xmm2 {%k7}
-// CHECK: vrcppbf16 %xmm3, %xmm2 {%k7} {z}
+// CHECK: vrcpbf16 %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0xd3]
- vrcppbf16 %xmm3, %xmm2 {%k7} {z}
+ vrcpbf16 %xmm3, %xmm2 {%k7} {z}
-// CHECK: vrcppbf16 %zmm3, %zmm2
+// CHECK: vrcpbf16 %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0xd3]
- vrcppbf16 %zmm3, %zmm2
+ vrcpbf16 %zmm3, %zmm2
-// CHECK: vrcppbf16 %zmm3, %zmm2 {%k7}
+// CHECK: vrcpbf16 %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0xd3]
- vrcppbf16 %zmm3, %zmm2 {%k7}
+ vrcpbf16 %zmm3, %zmm2 {%k7}
-// CHECK: vrcppbf16 %zmm3, %zmm2 {%k7} {z}
+// CHECK: vrcpbf16 %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0xd3]
- vrcppbf16 %zmm3, %zmm2 {%k7} {z}
+ vrcpbf16 %zmm3, %zmm2 {%k7} {z}
-// CHECK: vrcppbf16 %ymm3, %ymm2
+// CHECK: vrcpbf16 %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0xd3]
- vrcppbf16 %ymm3, %ymm2
+ vrcpbf16 %ymm3, %ymm2
-// CHECK: vrcppbf16 %ymm3, %ymm2 {%k7}
+// CHECK: vrcpbf16 %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0xd3]
- vrcppbf16 %ymm3, %ymm2 {%k7}
+ vrcpbf16 %ymm3, %ymm2 {%k7}
-// CHECK: vrcppbf16 %ymm3, %ymm2 {%k7} {z}
+// CHECK: vrcpbf16 %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0xd3]
- vrcppbf16 %ymm3, %ymm2 {%k7} {z}
+ vrcpbf16 %ymm3, %ymm2 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%esp,%esi,8), %xmm2
+// CHECK: vrcpbf16 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%esp,%esi,8), %xmm2
+ vrcpbf16 268435456(%esp,%esi,8), %xmm2
-// CHECK: vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7}
+ vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vrcppbf16 (%eax){1to8}, %xmm2
+// CHECK: vrcpbf16 (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4c,0x10]
- vrcppbf16 (%eax){1to8}, %xmm2
+ vrcpbf16 (%eax){1to8}, %xmm2
-// CHECK: vrcppbf16 -512(,%ebp,2), %xmm2
+// CHECK: vrcpbf16 -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vrcppbf16 -512(,%ebp,2), %xmm2
+ vrcpbf16 -512(,%ebp,2), %xmm2
-// CHECK: vrcppbf16 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vrcpbf16 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f]
- vrcppbf16 2032(%ecx), %xmm2 {%k7} {z}
+ vrcpbf16 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80]
- vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%esp,%esi,8), %ymm2
+// CHECK: vrcpbf16 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%esp,%esi,8), %ymm2
+ vrcpbf16 268435456(%esp,%esi,8), %ymm2
-// CHECK: vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7}
+ vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vrcppbf16 (%eax){1to16}, %ymm2
+// CHECK: vrcpbf16 (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4c,0x10]
- vrcppbf16 (%eax){1to16}, %ymm2
+ vrcpbf16 (%eax){1to16}, %ymm2
-// CHECK: vrcppbf16 -1024(,%ebp,2), %ymm2
+// CHECK: vrcpbf16 -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vrcppbf16 -1024(,%ebp,2), %ymm2
+ vrcpbf16 -1024(,%ebp,2), %ymm2
-// CHECK: vrcppbf16 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vrcpbf16 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f]
- vrcppbf16 4064(%ecx), %ymm2 {%k7} {z}
+ vrcpbf16 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80]
- vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%esp,%esi,8), %zmm2
+// CHECK: vrcpbf16 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%esp,%esi,8), %zmm2
+ vrcpbf16 268435456(%esp,%esi,8), %zmm2
-// CHECK: vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7}
+ vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vrcppbf16 (%eax){1to32}, %zmm2
+// CHECK: vrcpbf16 (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4c,0x10]
- vrcppbf16 (%eax){1to32}, %zmm2
+ vrcpbf16 (%eax){1to32}, %zmm2
-// CHECK: vrcppbf16 -2048(,%ebp,2), %zmm2
+// CHECK: vrcpbf16 -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vrcppbf16 -2048(,%ebp,2), %zmm2
+ vrcpbf16 -2048(,%ebp,2), %zmm2
-// CHECK: vrcppbf16 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vrcpbf16 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f]
- vrcppbf16 8128(%ecx), %zmm2 {%k7} {z}
+ vrcpbf16 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80]
- vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %zmm3, %zmm2
+// CHECK: vreducebf16 $123, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %zmm3, %zmm2
+ vreducebf16 $123, %zmm3, %zmm2
-// CHECK: vreducenepbf16 $123, %zmm3, %zmm2 {%k7}
+// CHECK: vreducebf16 $123, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %zmm3, %zmm2 {%k7}
+ vreducebf16 $123, %zmm3, %zmm2 {%k7}
-// CHECK: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
+ vreducebf16 $123, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %ymm3, %ymm2
+// CHECK: vreducebf16 $123, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %ymm3, %ymm2
+ vreducebf16 $123, %ymm3, %ymm2
-// CHECK: vreducenepbf16 $123, %ymm3, %ymm2 {%k7}
+// CHECK: vreducebf16 $123, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %ymm3, %ymm2 {%k7}
+ vreducebf16 $123, %ymm3, %ymm2 {%k7}
-// CHECK: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vreducebf16 $123, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
+ vreducebf16 $123, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %xmm3, %xmm2
+// CHECK: vreducebf16 $123, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %xmm3, %xmm2
+ vreducebf16 $123, %xmm3, %xmm2
-// CHECK: vreducenepbf16 $123, %xmm3, %xmm2 {%k7}
+// CHECK: vreducebf16 $123, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %xmm3, %xmm2 {%k7}
+ vreducebf16 $123, %xmm3, %xmm2 {%k7}
-// CHECK: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b]
- vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
+ vreducebf16 $123, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
+// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
+ vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2
-// CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+ vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vreducenepbf16 $123, (%eax){1to8}, %xmm2
+// CHECK: vreducebf16 $123, (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b]
- vreducenepbf16 $123, (%eax){1to8}, %xmm2
+ vreducebf16 $123, (%eax){1to8}, %xmm2
-// CHECK: vreducenepbf16 $123, -512(,%ebp,2), %xmm2
+// CHECK: vreducebf16 $123, -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vreducenepbf16 $123, -512(,%ebp,2), %xmm2
+ vreducebf16 $123, -512(,%ebp,2), %xmm2
-// CHECK: vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+ vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b]
- vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
+// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
+ vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2
-// CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+ vreducebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vreducenepbf16 $123, (%eax){1to16}, %ymm2
+// CHECK: vreducebf16 $123, (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b]
- vreducenepbf16 $123, (%eax){1to16}, %ymm2
+ vreducebf16 $123, (%eax){1to16}, %ymm2
-// CHECK: vreducenepbf16 $123, -1024(,%ebp,2), %ymm2
+// CHECK: vreducebf16 $123, -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vreducenepbf16 $123, -1024(,%ebp,2), %ymm2
+ vreducebf16 $123, -1024(,%ebp,2), %ymm2
-// CHECK: vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+ vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b]
- vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
+// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
+ vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2
-// CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+ vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vreducenepbf16 $123, (%eax){1to32}, %zmm2
+// CHECK: vreducebf16 $123, (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b]
- vreducenepbf16 $123, (%eax){1to32}, %zmm2
+ vreducebf16 $123, (%eax){1to32}, %zmm2
-// CHECK: vreducenepbf16 $123, -2048(,%ebp,2), %zmm2
+// CHECK: vreducebf16 $123, -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vreducenepbf16 $123, -2048(,%ebp,2), %zmm2
+ vreducebf16 $123, -2048(,%ebp,2), %zmm2
-// CHECK: vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+ vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b]
- vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2
+// CHECK: vrndscalebf16 $123, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %zmm3, %zmm2
+ vrndscalebf16 $123, %zmm3, %zmm2
-// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7}
+// CHECK: vrndscalebf16 $123, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7}
+ vrndscalebf16 $123, %zmm3, %zmm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z}
+ vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2
+// CHECK: vrndscalebf16 $123, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %ymm3, %ymm2
+ vrndscalebf16 $123, %ymm3, %ymm2
-// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7}
+// CHECK: vrndscalebf16 $123, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7}
+ vrndscalebf16 $123, %ymm3, %ymm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z}
+ vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2
+// CHECK: vrndscalebf16 $123, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %xmm3, %xmm2
+ vrndscalebf16 $123, %xmm3, %xmm2
-// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7}
+// CHECK: vrndscalebf16 $123, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7}
+ vrndscalebf16 $123, %xmm3, %xmm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b]
- vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z}
+ vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
+// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2
+ vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2
-// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
+ vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%eax){1to8}, %xmm2
+// CHECK: vrndscalebf16 $123, (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b]
- vrndscalenepbf16 $123, (%eax){1to8}, %xmm2
+ vrndscalebf16 $123, (%eax){1to8}, %xmm2
-// CHECK: vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2
+// CHECK: vrndscalebf16 $123, -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2
+ vrndscalebf16 $123, -512(,%ebp,2), %xmm2
-// CHECK: vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
+ vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
+// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2
+ vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2
-// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
+ vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%eax){1to16}, %ymm2
+// CHECK: vrndscalebf16 $123, (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b]
- vrndscalenepbf16 $123, (%eax){1to16}, %ymm2
+ vrndscalebf16 $123, (%eax){1to16}, %ymm2
-// CHECK: vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2
+// CHECK: vrndscalebf16 $123, -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2
+ vrndscalebf16 $123, -1024(,%ebp,2), %ymm2
-// CHECK: vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
+ vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
+// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2
+ vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2
-// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
+ vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%eax){1to32}, %zmm2
+// CHECK: vrndscalebf16 $123, (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b]
- vrndscalenepbf16 $123, (%eax){1to32}, %zmm2
+ vrndscalebf16 $123, (%eax){1to32}, %zmm2
-// CHECK: vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2
+// CHECK: vrndscalebf16 $123, -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2
+ vrndscalebf16 $123, -2048(,%ebp,2), %zmm2
-// CHECK: vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
+ vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 %xmm3, %xmm2
+// CHECK: vrsqrtbf16 %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xd3]
- vrsqrtpbf16 %xmm3, %xmm2
+ vrsqrtbf16 %xmm3, %xmm2
-// CHECK: vrsqrtpbf16 %xmm3, %xmm2 {%k7}
+// CHECK: vrsqrtbf16 %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0xd3]
- vrsqrtpbf16 %xmm3, %xmm2 {%k7}
+ vrsqrtbf16 %xmm3, %xmm2 {%k7}
-// CHECK: vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0xd3]
- vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z}
+ vrsqrtbf16 %xmm3, %xmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 %zmm3, %zmm2
+// CHECK: vrsqrtbf16 %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xd3]
- vrsqrtpbf16 %zmm3, %zmm2
+ vrsqrtbf16 %zmm3, %zmm2
-// CHECK: vrsqrtpbf16 %zmm3, %zmm2 {%k7}
+// CHECK: vrsqrtbf16 %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0xd3]
- vrsqrtpbf16 %zmm3, %zmm2 {%k7}
+ vrsqrtbf16 %zmm3, %zmm2 {%k7}
-// CHECK: vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0xd3]
- vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z}
+ vrsqrtbf16 %zmm3, %zmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 %ymm3, %ymm2
+// CHECK: vrsqrtbf16 %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xd3]
- vrsqrtpbf16 %ymm3, %ymm2
+ vrsqrtbf16 %ymm3, %ymm2
-// CHECK: vrsqrtpbf16 %ymm3, %ymm2 {%k7}
+// CHECK: vrsqrtbf16 %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0xd3]
- vrsqrtpbf16 %ymm3, %ymm2 {%k7}
+ vrsqrtbf16 %ymm3, %ymm2 {%k7}
-// CHECK: vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z}
+// CHECK: vrsqrtbf16 %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0xd3]
- vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z}
+ vrsqrtbf16 %ymm3, %ymm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2
+// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2
+ vrsqrtbf16 268435456(%esp,%esi,8), %xmm2
-// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7}
+ vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vrsqrtpbf16 (%eax){1to8}, %xmm2
+// CHECK: vrsqrtbf16 (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4e,0x10]
- vrsqrtpbf16 (%eax){1to8}, %xmm2
+ vrsqrtbf16 (%eax){1to8}, %xmm2
-// CHECK: vrsqrtpbf16 -512(,%ebp,2), %xmm2
+// CHECK: vrsqrtbf16 -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vrsqrtpbf16 -512(,%ebp,2), %xmm2
+ vrsqrtbf16 -512(,%ebp,2), %xmm2
-// CHECK: vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f]
- vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z}
+ vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80]
- vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2
+// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2
+ vrsqrtbf16 268435456(%esp,%esi,8), %ymm2
-// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7}
+ vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vrsqrtpbf16 (%eax){1to16}, %ymm2
+// CHECK: vrsqrtbf16 (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4e,0x10]
- vrsqrtpbf16 (%eax){1to16}, %ymm2
+ vrsqrtbf16 (%eax){1to16}, %ymm2
-// CHECK: vrsqrtpbf16 -1024(,%ebp,2), %ymm2
+// CHECK: vrsqrtbf16 -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vrsqrtpbf16 -1024(,%ebp,2), %ymm2
+ vrsqrtbf16 -1024(,%ebp,2), %ymm2
-// CHECK: vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f]
- vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z}
+ vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80]
- vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2
+// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2
+ vrsqrtbf16 268435456(%esp,%esi,8), %zmm2
-// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7}
+ vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vrsqrtpbf16 (%eax){1to32}, %zmm2
+// CHECK: vrsqrtbf16 (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4e,0x10]
- vrsqrtpbf16 (%eax){1to32}, %zmm2
+ vrsqrtbf16 (%eax){1to32}, %zmm2
-// CHECK: vrsqrtpbf16 -2048(,%ebp,2), %zmm2
+// CHECK: vrsqrtbf16 -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vrsqrtpbf16 -2048(,%ebp,2), %zmm2
+ vrsqrtbf16 -2048(,%ebp,2), %zmm2
-// CHECK: vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f]
- vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z}
+ vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80]
- vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0xd4]
- vscalefpbf16 %ymm4, %ymm3, %ymm2
+ vscalefbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0xd4]
- vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0xd4]
- vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0xd4]
- vscalefpbf16 %zmm4, %zmm3, %zmm2
+ vscalefbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0xd4]
- vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0xd4]
- vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0xd4]
- vscalefpbf16 %xmm4, %xmm3, %xmm2
+ vscalefbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0xd4]
- vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0xd4]
- vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vscalefbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x2c,0x10]
- vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2
+ vscalefbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f]
- vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80]
- vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vscalefbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x2c,0x10]
- vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2
+ vscalefbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f]
- vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vscalefbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80]
- vscalefpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vscalefbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vscalefbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x2c,0x10]
- vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2
+ vscalefbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f]
- vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80]
- vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 %xmm3, %xmm2
+// CHECK: vsqrtbf16 %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0xd3]
- vsqrtnepbf16 %xmm3, %xmm2
+ vsqrtbf16 %xmm3, %xmm2
-// CHECK: vsqrtnepbf16 %xmm3, %xmm2 {%k7}
+// CHECK: vsqrtbf16 %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0xd3]
- vsqrtnepbf16 %xmm3, %xmm2 {%k7}
+ vsqrtbf16 %xmm3, %xmm2 {%k7}
-// CHECK: vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z}
+// CHECK: vsqrtbf16 %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0xd3]
- vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z}
+ vsqrtbf16 %xmm3, %xmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 %zmm3, %zmm2
+// CHECK: vsqrtbf16 %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0xd3]
- vsqrtnepbf16 %zmm3, %zmm2
+ vsqrtbf16 %zmm3, %zmm2
-// CHECK: vsqrtnepbf16 %zmm3, %zmm2 {%k7}
+// CHECK: vsqrtbf16 %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0xd3]
- vsqrtnepbf16 %zmm3, %zmm2 {%k7}
+ vsqrtbf16 %zmm3, %zmm2 {%k7}
-// CHECK: vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z}
+// CHECK: vsqrtbf16 %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0xd3]
- vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z}
+ vsqrtbf16 %zmm3, %zmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 %ymm3, %ymm2
+// CHECK: vsqrtbf16 %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0xd3]
- vsqrtnepbf16 %ymm3, %ymm2
+ vsqrtbf16 %ymm3, %ymm2
-// CHECK: vsqrtnepbf16 %ymm3, %ymm2 {%k7}
+// CHECK: vsqrtbf16 %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0xd3]
- vsqrtnepbf16 %ymm3, %ymm2 {%k7}
+ vsqrtbf16 %ymm3, %ymm2 {%k7}
-// CHECK: vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z}
+// CHECK: vsqrtbf16 %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0xd3]
- vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z}
+ vsqrtbf16 %ymm3, %ymm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2
+// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2
+ vsqrtbf16 268435456(%esp,%esi,8), %xmm2
-// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7}
+// CHECK: vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7}
+ vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7}
-// CHECK: vsqrtnepbf16 (%eax){1to8}, %xmm2
+// CHECK: vsqrtbf16 (%eax){1to8}, %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x51,0x10]
- vsqrtnepbf16 (%eax){1to8}, %xmm2
+ vsqrtbf16 (%eax){1to8}, %xmm2
-// CHECK: vsqrtnepbf16 -512(,%ebp,2), %xmm2
+// CHECK: vsqrtbf16 -512(,%ebp,2), %xmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vsqrtnepbf16 -512(,%ebp,2), %xmm2
+ vsqrtbf16 -512(,%ebp,2), %xmm2
-// CHECK: vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z}
+// CHECK: vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f]
- vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z}
+ vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80]
- vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
+ vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2
+// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2
+ vsqrtbf16 268435456(%esp,%esi,8), %ymm2
-// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7}
+// CHECK: vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7}
+ vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7}
-// CHECK: vsqrtnepbf16 (%eax){1to16}, %ymm2
+// CHECK: vsqrtbf16 (%eax){1to16}, %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x51,0x10]
- vsqrtnepbf16 (%eax){1to16}, %ymm2
+ vsqrtbf16 (%eax){1to16}, %ymm2
-// CHECK: vsqrtnepbf16 -1024(,%ebp,2), %ymm2
+// CHECK: vsqrtbf16 -1024(,%ebp,2), %ymm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vsqrtnepbf16 -1024(,%ebp,2), %ymm2
+ vsqrtbf16 -1024(,%ebp,2), %ymm2
-// CHECK: vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z}
+// CHECK: vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f]
- vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z}
+ vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80]
- vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
+ vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2
+// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2
+ vsqrtbf16 268435456(%esp,%esi,8), %zmm2
-// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7}
+// CHECK: vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7}
+ vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7}
-// CHECK: vsqrtnepbf16 (%eax){1to32}, %zmm2
+// CHECK: vsqrtbf16 (%eax){1to32}, %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x51,0x10]
- vsqrtnepbf16 (%eax){1to32}, %zmm2
+ vsqrtbf16 (%eax){1to32}, %zmm2
-// CHECK: vsqrtnepbf16 -2048(,%ebp,2), %zmm2
+// CHECK: vsqrtbf16 -2048(,%ebp,2), %zmm2
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vsqrtnepbf16 -2048(,%ebp,2), %zmm2
+ vsqrtbf16 -2048(,%ebp,2), %zmm2
-// CHECK: vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z}
+// CHECK: vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f]
- vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z}
+ vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80]
- vsqrtnepbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
+ vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z}
-// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2
+// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0xd4]
- vsubnepbf16 %ymm4, %ymm3, %ymm2
+ vsubbf16 %ymm4, %ymm3, %ymm2
-// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0xd4]
- vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7}
+ vsubbf16 %ymm4, %ymm3, %ymm2 {%k7}
-// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0xd4]
- vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
+ vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2
+// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0xd4]
- vsubnepbf16 %zmm4, %zmm3, %zmm2
+ vsubbf16 %zmm4, %zmm3, %zmm2
-// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0xd4]
- vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7}
+ vsubbf16 %zmm4, %zmm3, %zmm2 {%k7}
-// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0xd4]
- vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
+ vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2
+// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0xd4]
- vsubnepbf16 %xmm4, %xmm3, %xmm2
+ vsubbf16 %xmm4, %xmm3, %xmm2
-// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0xd4]
- vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7}
+ vsubbf16 %xmm4, %xmm3, %xmm2 {%k7}
-// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0xd4]
- vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
+ vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+// CHECK: vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
+ vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2
-// CHECK: vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+// CHECK: vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
+ vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
-// CHECK: vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2
+// CHECK: vsubbf16 (%eax){1to32}, %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5c,0x10]
- vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2
+ vsubbf16 (%eax){1to32}, %zmm3, %zmm2
-// CHECK: vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+// CHECK: vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2
+ vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2
-// CHECK: vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+// CHECK: vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f]
- vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
+ vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+// CHECK: vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80]
- vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
+ vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+// CHECK: vsubbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
+ vsubbf16 268435456(%esp,%esi,8), %ymm3, %ymm2
-// CHECK: vsubnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+// CHECK: vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
+ vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
-// CHECK: vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2
+// CHECK: vsubbf16 (%eax){1to16}, %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5c,0x10]
- vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2
+ vsubbf16 (%eax){1to16}, %ymm3, %ymm2
-// CHECK: vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+// CHECK: vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2
+ vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2
-// CHECK: vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+// CHECK: vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f]
- vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
+ vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+// CHECK: vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80]
- vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
+ vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+// CHECK: vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
+ vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2
-// CHECK: vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+// CHECK: vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
+ vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
-// CHECK: vsubnepbf16 (%eax){1to8}, %xmm3, %xmm2
+// CHECK: vsubbf16 (%eax){1to8}, %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5c,0x10]
- vsubnepbf16 (%eax){1to8}, %xmm3, %xmm2
+ vsubbf16 (%eax){1to8}, %xmm3, %xmm2
-// CHECK: vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+// CHECK: vsubbf16 -512(,%ebp,2), %xmm3, %xmm2
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2
+ vsubbf16 -512(,%ebp,2), %xmm3, %xmm2
-// CHECK: vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+// CHECK: vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f]
- vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
+ vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+// CHECK: vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80]
- vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
+ vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
diff --git a/llvm/test/MC/X86/avx10.2-bf16-32-intel.s b/llvm/test/MC/X86/avx10.2-bf16-32-intel.s
index 30c2cf45297bc0..f19e41d52d4ee3 100644
--- a/llvm/test/MC/X86/avx10.2-bf16-32-intel.s
+++ b/llvm/test/MC/X86/avx10.2-bf16-32-intel.s
@@ -1,208 +1,208 @@
// RUN: llvm-mc -triple i386 -x86-asm-syntax=intel -output-asm-variant=1 --show-encoding %s | FileCheck %s
-// CHECK: vaddnepbf16 ymm2, ymm3, ymm4
+// CHECK: vaddbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0xd4]
- vaddnepbf16 ymm2, ymm3, ymm4
+ vaddbf16 ymm2, ymm3, ymm4
-// CHECK: vaddnepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vaddbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0xd4]
- vaddnepbf16 ymm2 {k7}, ymm3, ymm4
+ vaddbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0xd4]
- vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vaddbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vaddnepbf16 zmm2, zmm3, zmm4
+// CHECK: vaddbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0xd4]
- vaddnepbf16 zmm2, zmm3, zmm4
+ vaddbf16 zmm2, zmm3, zmm4
-// CHECK: vaddnepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vaddbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0xd4]
- vaddnepbf16 zmm2 {k7}, zmm3, zmm4
+ vaddbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0xd4]
- vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vaddbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vaddnepbf16 xmm2, xmm3, xmm4
+// CHECK: vaddbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0xd4]
- vaddnepbf16 xmm2, xmm3, xmm4
+ vaddbf16 xmm2, xmm3, xmm4
-// CHECK: vaddnepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vaddbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0xd4]
- vaddnepbf16 xmm2 {k7}, xmm3, xmm4
+ vaddbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0xd4]
- vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vaddbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vaddbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x58,0x10]
- vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vaddbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f]
- vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x58,0x52,0x80]
- vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vaddbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x58,0x10]
- vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vaddbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f]
- vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x58,0x52,0x80]
- vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10]
- vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00]
- vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vaddbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x58,0x10]
- vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vaddbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f]
- vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x58,0x52,0x80]
- vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vcmppbf16 k5, ymm3, ymm4, 123
+// CHECK: vcmpbf16 k5, ymm3, ymm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b]
- vcmppbf16 k5, ymm3, ymm4, 123
+ vcmpbf16 k5, ymm3, ymm4, 123
-// CHECK: vcmppbf16 k5 {k7}, ymm3, ymm4, 123
+// CHECK: vcmpbf16 k5 {k7}, ymm3, ymm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b]
- vcmppbf16 k5 {k7}, ymm3, ymm4, 123
+ vcmpbf16 k5 {k7}, ymm3, ymm4, 123
-// CHECK: vcmppbf16 k5, xmm3, xmm4, 123
+// CHECK: vcmpbf16 k5, xmm3, xmm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b]
- vcmppbf16 k5, xmm3, xmm4, 123
+ vcmpbf16 k5, xmm3, xmm4, 123
-// CHECK: vcmppbf16 k5 {k7}, xmm3, xmm4, 123
+// CHECK: vcmpbf16 k5 {k7}, xmm3, xmm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b]
- vcmppbf16 k5 {k7}, xmm3, xmm4, 123
+ vcmpbf16 k5 {k7}, xmm3, xmm4, 123
-// CHECK: vcmppbf16 k5, zmm3, zmm4, 123
+// CHECK: vcmpbf16 k5, zmm3, zmm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b]
- vcmppbf16 k5, zmm3, zmm4, 123
+ vcmpbf16 k5, zmm3, zmm4, 123
-// CHECK: vcmppbf16 k5 {k7}, zmm3, zmm4, 123
+// CHECK: vcmpbf16 k5 {k7}, zmm3, zmm4, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b]
- vcmppbf16 k5 {k7}, zmm3, zmm4, 123
+ vcmpbf16 k5 {k7}, zmm3, zmm4, 123
-// CHECK: vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
+ vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
+ vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123
+// CHECK: vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b]
- vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123
+ vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123
-// CHECK: vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
+// CHECK: vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
+ vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
+// CHECK: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
+ vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
+// CHECK: vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
+ vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
-// CHECK: vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
+ vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
+ vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123
+// CHECK: vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b]
- vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123
+ vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123
-// CHECK: vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
+// CHECK: vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
+ vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
+// CHECK: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
+ vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
+// CHECK: vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
+ vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
-// CHECK: vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
+ vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
+ vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
-// CHECK: vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123
+// CHECK: vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b]
- vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123
+ vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123
-// CHECK: vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
+// CHECK: vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
+ vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
+// CHECK: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
+ vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
+// CHECK: vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
+ vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
// CHECK: vcomsbf16 xmm2, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0xd3]
@@ -232,2783 +232,2783 @@
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80]
vcomsbf16 xmm2, word ptr [edx - 256]
-// CHECK: vdivnepbf16 ymm2, ymm3, ymm4
+// CHECK: vdivbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0xd4]
- vdivnepbf16 ymm2, ymm3, ymm4
+ vdivbf16 ymm2, ymm3, ymm4
-// CHECK: vdivnepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vdivbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0xd4]
- vdivnepbf16 ymm2 {k7}, ymm3, ymm4
+ vdivbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0xd4]
- vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vdivbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vdivnepbf16 zmm2, zmm3, zmm4
+// CHECK: vdivbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0xd4]
- vdivnepbf16 zmm2, zmm3, zmm4
+ vdivbf16 zmm2, zmm3, zmm4
-// CHECK: vdivnepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vdivbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0xd4]
- vdivnepbf16 zmm2 {k7}, zmm3, zmm4
+ vdivbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0xd4]
- vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vdivbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vdivnepbf16 xmm2, xmm3, xmm4
+// CHECK: vdivbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0xd4]
- vdivnepbf16 xmm2, xmm3, xmm4
+ vdivbf16 xmm2, xmm3, xmm4
-// CHECK: vdivnepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vdivbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0xd4]
- vdivnepbf16 xmm2 {k7}, xmm3, xmm4
+ vdivbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0xd4]
- vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vdivbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vdivbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5e,0x10]
- vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vdivbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f]
- vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80]
- vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vdivbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5e,0x10]
- vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vdivbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f]
- vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80]
- vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00]
- vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vdivbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5e,0x10]
- vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vdivbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f]
- vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80]
- vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmadd132bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0xd4]
- vfmadd132nepbf16 ymm2, ymm3, ymm4
+ vfmadd132bf16 ymm2, ymm3, ymm4
-// CHECK: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmadd132bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0xd4]
- vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmadd132bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0xd4]
- vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmadd132bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0xd4]
- vfmadd132nepbf16 zmm2, zmm3, zmm4
+ vfmadd132bf16 zmm2, zmm3, zmm4
-// CHECK: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmadd132bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0xd4]
- vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmadd132bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0xd4]
- vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmadd132bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0xd4]
- vfmadd132nepbf16 xmm2, xmm3, xmm4
+ vfmadd132bf16 xmm2, xmm3, xmm4
-// CHECK: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmadd132bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0xd4]
- vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmadd132bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0xd4]
- vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x98,0x10]
- vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f]
- vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x98,0x52,0x80]
- vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x98,0x10]
- vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f]
- vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x98,0x52,0x80]
- vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x98,0x10]
- vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f]
- vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x98,0x52,0x80]
- vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmadd213bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0xd4]
- vfmadd213nepbf16 ymm2, ymm3, ymm4
+ vfmadd213bf16 ymm2, ymm3, ymm4
-// CHECK: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmadd213bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0xd4]
- vfmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmadd213bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0xd4]
- vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmadd213bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0xd4]
- vfmadd213nepbf16 zmm2, zmm3, zmm4
+ vfmadd213bf16 zmm2, zmm3, zmm4
-// CHECK: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmadd213bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0xd4]
- vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmadd213bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0xd4]
- vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmadd213bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0xd4]
- vfmadd213nepbf16 xmm2, xmm3, xmm4
+ vfmadd213bf16 xmm2, xmm3, xmm4
-// CHECK: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmadd213bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0xd4]
- vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmadd213bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0xd4]
- vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xa8,0x10]
- vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f]
- vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80]
- vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xa8,0x10]
- vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f]
- vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80]
- vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xa8,0x10]
- vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f]
- vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80]
- vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmadd231bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0xd4]
- vfmadd231nepbf16 ymm2, ymm3, ymm4
+ vfmadd231bf16 ymm2, ymm3, ymm4
-// CHECK: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmadd231bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0xd4]
- vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmadd231bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0xd4]
- vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmadd231bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0xd4]
- vfmadd231nepbf16 zmm2, zmm3, zmm4
+ vfmadd231bf16 zmm2, zmm3, zmm4
-// CHECK: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmadd231bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0xd4]
- vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmadd231bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0xd4]
- vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmadd231bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0xd4]
- vfmadd231nepbf16 xmm2, xmm3, xmm4
+ vfmadd231bf16 xmm2, xmm3, xmm4
-// CHECK: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmadd231bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0xd4]
- vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmadd231bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0xd4]
- vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xb8,0x10]
- vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f]
- vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80]
- vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xb8,0x10]
- vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f]
- vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80]
- vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xb8,0x10]
- vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f]
- vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80]
- vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmsub132bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0xd4]
- vfmsub132nepbf16 ymm2, ymm3, ymm4
+ vfmsub132bf16 ymm2, ymm3, ymm4
-// CHECK: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmsub132bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0xd4]
- vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmsub132bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0xd4]
- vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmsub132bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0xd4]
- vfmsub132nepbf16 zmm2, zmm3, zmm4
+ vfmsub132bf16 zmm2, zmm3, zmm4
-// CHECK: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmsub132bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0xd4]
- vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmsub132bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0xd4]
- vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmsub132bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0xd4]
- vfmsub132nepbf16 xmm2, xmm3, xmm4
+ vfmsub132bf16 xmm2, xmm3, xmm4
-// CHECK: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmsub132bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0xd4]
- vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmsub132bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0xd4]
- vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9a,0x10]
- vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f]
- vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80]
- vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9a,0x10]
- vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f]
- vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80]
- vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9a,0x10]
- vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f]
- vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80]
- vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmsub213bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0xd4]
- vfmsub213nepbf16 ymm2, ymm3, ymm4
+ vfmsub213bf16 ymm2, ymm3, ymm4
-// CHECK: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmsub213bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0xd4]
- vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmsub213bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0xd4]
- vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmsub213bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0xd4]
- vfmsub213nepbf16 zmm2, zmm3, zmm4
+ vfmsub213bf16 zmm2, zmm3, zmm4
-// CHECK: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmsub213bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0xd4]
- vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmsub213bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0xd4]
- vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmsub213bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0xd4]
- vfmsub213nepbf16 xmm2, xmm3, xmm4
+ vfmsub213bf16 xmm2, xmm3, xmm4
-// CHECK: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmsub213bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0xd4]
- vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmsub213bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0xd4]
- vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xaa,0x10]
- vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f]
- vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80]
- vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xaa,0x10]
- vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f]
- vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80]
- vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xaa,0x10]
- vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f]
- vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80]
- vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfmsub231bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0xd4]
- vfmsub231nepbf16 ymm2, ymm3, ymm4
+ vfmsub231bf16 ymm2, ymm3, ymm4
-// CHECK: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfmsub231bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0xd4]
- vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfmsub231bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0xd4]
- vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfmsub231bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0xd4]
- vfmsub231nepbf16 zmm2, zmm3, zmm4
+ vfmsub231bf16 zmm2, zmm3, zmm4
-// CHECK: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfmsub231bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0xd4]
- vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfmsub231bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0xd4]
- vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfmsub231bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0xd4]
- vfmsub231nepbf16 xmm2, xmm3, xmm4
+ vfmsub231bf16 xmm2, xmm3, xmm4
-// CHECK: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfmsub231bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0xd4]
- vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfmsub231bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0xd4]
- vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xba,0x10]
- vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f]
- vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xba,0x52,0x80]
- vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xba,0x10]
- vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f]
- vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xba,0x52,0x80]
- vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xba,0x10]
- vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f]
- vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xba,0x52,0x80]
- vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmadd132bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0xd4]
- vfnmadd132nepbf16 ymm2, ymm3, ymm4
+ vfnmadd132bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0xd4]
- vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0xd4]
- vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmadd132bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0xd4]
- vfnmadd132nepbf16 zmm2, zmm3, zmm4
+ vfnmadd132bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0xd4]
- vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0xd4]
- vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmadd132bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0xd4]
- vfnmadd132nepbf16 xmm2, xmm3, xmm4
+ vfnmadd132bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0xd4]
- vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0xd4]
- vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9c,0x10]
- vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80]
- vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9c,0x10]
- vfnmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80]
- vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9c,0x10]
- vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f]
- vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80]
- vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmadd213nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmadd213bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0xd4]
- vfnmadd213nepbf16 ymm2, ymm3, ymm4
+ vfnmadd213bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0xd4]
- vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0xd4]
- vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmadd213bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0xd4]
- vfnmadd213nepbf16 zmm2, zmm3, zmm4
+ vfnmadd213bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0xd4]
- vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0xd4]
- vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmadd213bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0xd4]
- vfnmadd213nepbf16 xmm2, xmm3, xmm4
+ vfnmadd213bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0xd4]
- vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0xd4]
- vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xac,0x10]
- vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f]
- vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xac,0x52,0x80]
- vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xac,0x10]
- vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f]
- vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xac,0x52,0x80]
- vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xac,0x10]
- vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f]
- vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xac,0x52,0x80]
- vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmadd231bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0xd4]
- vfnmadd231nepbf16 ymm2, ymm3, ymm4
+ vfnmadd231bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0xd4]
- vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0xd4]
- vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmadd231bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0xd4]
- vfnmadd231nepbf16 zmm2, zmm3, zmm4
+ vfnmadd231bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0xd4]
- vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0xd4]
- vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmadd231bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0xd4]
- vfnmadd231nepbf16 xmm2, xmm3, xmm4
+ vfnmadd231bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0xd4]
- vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0xd4]
- vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbc,0x10]
- vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80]
- vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbc,0x10]
- vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80]
- vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbc,0x10]
- vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f]
- vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80]
- vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmsub132bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0xd4]
- vfnmsub132nepbf16 ymm2, ymm3, ymm4
+ vfnmsub132bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0xd4]
- vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0xd4]
- vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmsub132bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0xd4]
- vfnmsub132nepbf16 zmm2, zmm3, zmm4
+ vfnmsub132bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0xd4]
- vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0xd4]
- vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmsub132bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0xd4]
- vfnmsub132nepbf16 xmm2, xmm3, xmm4
+ vfnmsub132bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0xd4]
- vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0xd4]
- vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9e,0x10]
- vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80]
- vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9e,0x10]
- vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80]
- vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9e,0x10]
- vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f]
- vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80]
- vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmsub213bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0xd4]
- vfnmsub213nepbf16 ymm2, ymm3, ymm4
+ vfnmsub213bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0xd4]
- vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0xd4]
- vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmsub213bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0xd4]
- vfnmsub213nepbf16 zmm2, zmm3, zmm4
+ vfnmsub213bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0xd4]
- vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0xd4]
- vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmsub213bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0xd4]
- vfnmsub213nepbf16 xmm2, xmm3, xmm4
+ vfnmsub213bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0xd4]
- vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0xd4]
- vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xae,0x10]
- vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f]
- vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xae,0x52,0x80]
- vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xae,0x10]
- vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f]
- vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xae,0x52,0x80]
- vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xae,0x10]
- vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f]
- vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xae,0x52,0x80]
- vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymm4
+// CHECK: vfnmsub231bf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0xd4]
- vfnmsub231nepbf16 ymm2, ymm3, ymm4
+ vfnmsub231bf16 ymm2, ymm3, ymm4
-// CHECK: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0xd4]
- vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4
+ vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0xd4]
- vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmm4
+// CHECK: vfnmsub231bf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0xd4]
- vfnmsub231nepbf16 zmm2, zmm3, zmm4
+ vfnmsub231bf16 zmm2, zmm3, zmm4
-// CHECK: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0xd4]
- vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4
+ vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0xd4]
- vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmm4
+// CHECK: vfnmsub231bf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0xd4]
- vfnmsub231nepbf16 xmm2, xmm3, xmm4
+ vfnmsub231bf16 xmm2, xmm3, xmm4
-// CHECK: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0xd4]
- vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4
+ vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0xd4]
- vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbe,0x10]
- vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80]
- vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbe,0x10]
- vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80]
- vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbe,0x10]
- vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f]
- vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80]
- vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vfpclasspbf16 k5, zmm3, 123
+// CHECK: vfpclassbf16 k5, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b]
- vfpclasspbf16 k5, zmm3, 123
+ vfpclassbf16 k5, zmm3, 123
-// CHECK: vfpclasspbf16 k5 {k7}, zmm3, 123
+// CHECK: vfpclassbf16 k5 {k7}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b]
- vfpclasspbf16 k5 {k7}, zmm3, 123
+ vfpclassbf16 k5 {k7}, zmm3, 123
-// CHECK: vfpclasspbf16 k5, ymm3, 123
+// CHECK: vfpclassbf16 k5, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b]
- vfpclasspbf16 k5, ymm3, 123
+ vfpclassbf16 k5, ymm3, 123
-// CHECK: vfpclasspbf16 k5 {k7}, ymm3, 123
+// CHECK: vfpclassbf16 k5 {k7}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b]
- vfpclasspbf16 k5 {k7}, ymm3, 123
+ vfpclassbf16 k5 {k7}, ymm3, 123
-// CHECK: vfpclasspbf16 k5, xmm3, 123
+// CHECK: vfpclassbf16 k5, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b]
- vfpclasspbf16 k5, xmm3, 123
+ vfpclassbf16 k5, xmm3, 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmm3, 123
+// CHECK: vfpclassbf16 k5 {k7}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b]
- vfpclasspbf16 k5 {k7}, xmm3, 123
+ vfpclassbf16 k5 {k7}, xmm3, 123
-// CHECK: vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
+ vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b]
- vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+ vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to8}, 123
+// CHECK: vfpclassbf16 k5, word ptr [eax]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b]
- vfpclasspbf16 k5, word ptr [eax]{1to8}, 123
+ vfpclassbf16 k5, word ptr [eax]{1to8}, 123
-// CHECK: vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123
+// CHECK: vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123
+ vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
+// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
+ vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
+ vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
-// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to16}, 123
+// CHECK: vfpclassbf16 k5, word ptr [eax]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b]
- vfpclasspbf16 k5, word ptr [eax]{1to16}, 123
+ vfpclassbf16 k5, word ptr [eax]{1to16}, 123
-// CHECK: vfpclasspbf16 k5, ymmword ptr [2*ebp - 1024], 123
+// CHECK: vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vfpclasspbf16 k5, ymmword ptr [2*ebp - 1024], 123
+ vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123
-// CHECK: vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
+// CHECK: vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
+ vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
+ vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
-// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to32}, 123
+// CHECK: vfpclassbf16 k5, word ptr [eax]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b]
- vfpclasspbf16 k5, word ptr [eax]{1to32}, 123
+ vfpclassbf16 k5, word ptr [eax]{1to32}, 123
-// CHECK: vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123
+// CHECK: vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123
+ vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123
-// CHECK: vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
+// CHECK: vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
+ vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
+ vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
-// CHECK: vgetexppbf16 xmm2, xmm3
+// CHECK: vgetexpbf16 xmm2, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0xd3]
- vgetexppbf16 xmm2, xmm3
+ vgetexpbf16 xmm2, xmm3
-// CHECK: vgetexppbf16 xmm2 {k7}, xmm3
+// CHECK: vgetexpbf16 xmm2 {k7}, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0xd3]
- vgetexppbf16 xmm2 {k7}, xmm3
+ vgetexpbf16 xmm2 {k7}, xmm3
-// CHECK: vgetexppbf16 xmm2 {k7} {z}, xmm3
+// CHECK: vgetexpbf16 xmm2 {k7} {z}, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0xd3]
- vgetexppbf16 xmm2 {k7} {z}, xmm3
+ vgetexpbf16 xmm2 {k7} {z}, xmm3
-// CHECK: vgetexppbf16 zmm2, zmm3
+// CHECK: vgetexpbf16 zmm2, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0xd3]
- vgetexppbf16 zmm2, zmm3
+ vgetexpbf16 zmm2, zmm3
-// CHECK: vgetexppbf16 zmm2 {k7}, zmm3
+// CHECK: vgetexpbf16 zmm2 {k7}, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0xd3]
- vgetexppbf16 zmm2 {k7}, zmm3
+ vgetexpbf16 zmm2 {k7}, zmm3
-// CHECK: vgetexppbf16 zmm2 {k7} {z}, zmm3
+// CHECK: vgetexpbf16 zmm2 {k7} {z}, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0xd3]
- vgetexppbf16 zmm2 {k7} {z}, zmm3
+ vgetexpbf16 zmm2 {k7} {z}, zmm3
-// CHECK: vgetexppbf16 ymm2, ymm3
+// CHECK: vgetexpbf16 ymm2, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0xd3]
- vgetexppbf16 ymm2, ymm3
+ vgetexpbf16 ymm2, ymm3
-// CHECK: vgetexppbf16 ymm2 {k7}, ymm3
+// CHECK: vgetexpbf16 ymm2 {k7}, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0xd3]
- vgetexppbf16 ymm2 {k7}, ymm3
+ vgetexpbf16 ymm2 {k7}, ymm3
-// CHECK: vgetexppbf16 ymm2 {k7} {z}, ymm3
+// CHECK: vgetexpbf16 ymm2 {k7} {z}, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0xd3]
- vgetexppbf16 ymm2 {k7} {z}, ymm3
+ vgetexpbf16 ymm2 {k7} {z}, ymm3
-// CHECK: vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+ vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+ vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vgetexppbf16 xmm2, word ptr [eax]{1to8}
+// CHECK: vgetexpbf16 xmm2, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x42,0x10]
- vgetexppbf16 xmm2, word ptr [eax]{1to8}
+ vgetexpbf16 xmm2, word ptr [eax]{1to8}
-// CHECK: vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512]
+// CHECK: vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512]
+ vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512]
-// CHECK: vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+// CHECK: vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f]
- vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+ vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
-// CHECK: vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+// CHECK: vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80]
- vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+ vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
-// CHECK: vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+ vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+ vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vgetexppbf16 ymm2, word ptr [eax]{1to16}
+// CHECK: vgetexpbf16 ymm2, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x42,0x10]
- vgetexppbf16 ymm2, word ptr [eax]{1to16}
+ vgetexpbf16 ymm2, word ptr [eax]{1to16}
-// CHECK: vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+// CHECK: vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+ vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024]
-// CHECK: vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+// CHECK: vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f]
- vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+ vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
-// CHECK: vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+// CHECK: vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80]
- vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+ vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
-// CHECK: vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10]
- vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+ vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00]
- vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+ vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vgetexppbf16 zmm2, word ptr [eax]{1to32}
+// CHECK: vgetexpbf16 zmm2, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x42,0x10]
- vgetexppbf16 zmm2, word ptr [eax]{1to32}
+ vgetexpbf16 zmm2, word ptr [eax]{1to32}
-// CHECK: vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+// CHECK: vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+ vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048]
-// CHECK: vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+// CHECK: vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f]
- vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+ vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
-// CHECK: vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+// CHECK: vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80]
- vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+ vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
-// CHECK: vgetmantpbf16 zmm2, zmm3, 123
+// CHECK: vgetmantbf16 zmm2, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b]
- vgetmantpbf16 zmm2, zmm3, 123
+ vgetmantbf16 zmm2, zmm3, 123
-// CHECK: vgetmantpbf16 zmm2 {k7}, zmm3, 123
+// CHECK: vgetmantbf16 zmm2 {k7}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b]
- vgetmantpbf16 zmm2 {k7}, zmm3, 123
+ vgetmantbf16 zmm2 {k7}, zmm3, 123
-// CHECK: vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123
+// CHECK: vgetmantbf16 zmm2 {k7} {z}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b]
- vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123
+ vgetmantbf16 zmm2 {k7} {z}, zmm3, 123
-// CHECK: vgetmantpbf16 ymm2, ymm3, 123
+// CHECK: vgetmantbf16 ymm2, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b]
- vgetmantpbf16 ymm2, ymm3, 123
+ vgetmantbf16 ymm2, ymm3, 123
-// CHECK: vgetmantpbf16 ymm2 {k7}, ymm3, 123
+// CHECK: vgetmantbf16 ymm2 {k7}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b]
- vgetmantpbf16 ymm2 {k7}, ymm3, 123
+ vgetmantbf16 ymm2 {k7}, ymm3, 123
-// CHECK: vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123
+// CHECK: vgetmantbf16 ymm2 {k7} {z}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b]
- vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123
+ vgetmantbf16 ymm2 {k7} {z}, ymm3, 123
-// CHECK: vgetmantpbf16 xmm2, xmm3, 123
+// CHECK: vgetmantbf16 xmm2, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b]
- vgetmantpbf16 xmm2, xmm3, 123
+ vgetmantbf16 xmm2, xmm3, 123
-// CHECK: vgetmantpbf16 xmm2 {k7}, xmm3, 123
+// CHECK: vgetmantbf16 xmm2 {k7}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b]
- vgetmantpbf16 xmm2 {k7}, xmm3, 123
+ vgetmantbf16 xmm2 {k7}, xmm3, 123
-// CHECK: vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123
+// CHECK: vgetmantbf16 xmm2 {k7} {z}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b]
- vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123
+ vgetmantbf16 xmm2 {k7} {z}, xmm3, 123
-// CHECK: vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+ vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+ vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123
+// CHECK: vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b]
- vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123
+ vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123
-// CHECK: vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+// CHECK: vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+ vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123
-// CHECK: vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+// CHECK: vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+ vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
-// CHECK: vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+// CHECK: vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+ vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
-// CHECK: vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+ vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+// CHECK: vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+ vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
-// CHECK: vgetmantpbf16 ymm2, word ptr [eax]{1to16}, 123
+// CHECK: vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b]
- vgetmantpbf16 ymm2, word ptr [eax]{1to16}, 123
+ vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123
-// CHECK: vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+// CHECK: vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+ vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
-// CHECK: vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+// CHECK: vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+ vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
-// CHECK: vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+// CHECK: vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+ vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
-// CHECK: vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+ vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+ vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123
+// CHECK: vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b]
- vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123
+ vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123
-// CHECK: vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+// CHECK: vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+ vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
-// CHECK: vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+// CHECK: vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b]
- vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+ vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
-// CHECK: vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+// CHECK: vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b]
- vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+ vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
-// CHECK: vmaxpbf16 ymm2, ymm3, ymm4
+// CHECK: vmaxbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0xd4]
- vmaxpbf16 ymm2, ymm3, ymm4
+ vmaxbf16 ymm2, ymm3, ymm4
-// CHECK: vmaxpbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vmaxbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0xd4]
- vmaxpbf16 ymm2 {k7}, ymm3, ymm4
+ vmaxbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0xd4]
- vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vmaxpbf16 zmm2, zmm3, zmm4
+// CHECK: vmaxbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0xd4]
- vmaxpbf16 zmm2, zmm3, zmm4
+ vmaxbf16 zmm2, zmm3, zmm4
-// CHECK: vmaxpbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vmaxbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0xd4]
- vmaxpbf16 zmm2 {k7}, zmm3, zmm4
+ vmaxbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0xd4]
- vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vmaxpbf16 xmm2, xmm3, xmm4
+// CHECK: vmaxbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0xd4]
- vmaxpbf16 xmm2, xmm3, xmm4
+ vmaxbf16 xmm2, xmm3, xmm4
-// CHECK: vmaxpbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vmaxbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0xd4]
- vmaxpbf16 xmm2 {k7}, xmm3, xmm4
+ vmaxbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0xd4]
- vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5f,0x10]
- vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f]
- vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80]
- vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5f,0x10]
- vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vmaxbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f]
- vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vmaxbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80]
- vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00]
- vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5f,0x10]
- vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f]
- vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80]
- vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vminpbf16 ymm2, ymm3, ymm4
+// CHECK: vminbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0xd4]
- vminpbf16 ymm2, ymm3, ymm4
+ vminbf16 ymm2, ymm3, ymm4
-// CHECK: vminpbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vminbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0xd4]
- vminpbf16 ymm2 {k7}, ymm3, ymm4
+ vminbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0xd4]
- vminpbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vminbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vminpbf16 zmm2, zmm3, zmm4
+// CHECK: vminbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0xd4]
- vminpbf16 zmm2, zmm3, zmm4
+ vminbf16 zmm2, zmm3, zmm4
-// CHECK: vminpbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vminbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0xd4]
- vminpbf16 zmm2 {k7}, zmm3, zmm4
+ vminbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0xd4]
- vminpbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vminbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vminpbf16 xmm2, xmm3, xmm4
+// CHECK: vminbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0xd4]
- vminpbf16 xmm2, xmm3, xmm4
+ vminbf16 xmm2, xmm3, xmm4
-// CHECK: vminpbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vminbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0xd4]
- vminpbf16 xmm2 {k7}, xmm3, xmm4
+ vminbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vminpbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0xd4]
- vminpbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vminbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vminpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vminbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5d,0x10]
- vminpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vminbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f]
- vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80]
- vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vminpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vminbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5d,0x10]
- vminpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vminbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f]
- vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80]
- vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10]
- vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00]
- vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vminpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vminbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5d,0x10]
- vminpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vminbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f]
- vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80]
- vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vmulnepbf16 ymm2, ymm3, ymm4
+// CHECK: vmulbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0xd4]
- vmulnepbf16 ymm2, ymm3, ymm4
+ vmulbf16 ymm2, ymm3, ymm4
-// CHECK: vmulnepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vmulbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0xd4]
- vmulnepbf16 ymm2 {k7}, ymm3, ymm4
+ vmulbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0xd4]
- vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vmulbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vmulnepbf16 zmm2, zmm3, zmm4
+// CHECK: vmulbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0xd4]
- vmulnepbf16 zmm2, zmm3, zmm4
+ vmulbf16 zmm2, zmm3, zmm4
-// CHECK: vmulnepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vmulbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0xd4]
- vmulnepbf16 zmm2 {k7}, zmm3, zmm4
+ vmulbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0xd4]
- vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vmulbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vmulnepbf16 xmm2, xmm3, xmm4
+// CHECK: vmulbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0xd4]
- vmulnepbf16 xmm2, xmm3, xmm4
+ vmulbf16 xmm2, xmm3, xmm4
-// CHECK: vmulnepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vmulbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0xd4]
- vmulnepbf16 xmm2 {k7}, xmm3, xmm4
+ vmulbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0xd4]
- vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vmulbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vmulbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x59,0x10]
- vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vmulbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f]
- vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x59,0x52,0x80]
- vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vmulbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x59,0x10]
- vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vmulbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f]
- vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x59,0x52,0x80]
- vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10]
- vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00]
- vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vmulbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x59,0x10]
- vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vmulbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f]
- vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x59,0x52,0x80]
- vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vrcppbf16 xmm2, xmm3
+// CHECK: vrcpbf16 xmm2, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0xd3]
- vrcppbf16 xmm2, xmm3
+ vrcpbf16 xmm2, xmm3
-// CHECK: vrcppbf16 xmm2 {k7}, xmm3
+// CHECK: vrcpbf16 xmm2 {k7}, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0xd3]
- vrcppbf16 xmm2 {k7}, xmm3
+ vrcpbf16 xmm2 {k7}, xmm3
-// CHECK: vrcppbf16 xmm2 {k7} {z}, xmm3
+// CHECK: vrcpbf16 xmm2 {k7} {z}, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0xd3]
- vrcppbf16 xmm2 {k7} {z}, xmm3
+ vrcpbf16 xmm2 {k7} {z}, xmm3
-// CHECK: vrcppbf16 zmm2, zmm3
+// CHECK: vrcpbf16 zmm2, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0xd3]
- vrcppbf16 zmm2, zmm3
+ vrcpbf16 zmm2, zmm3
-// CHECK: vrcppbf16 zmm2 {k7}, zmm3
+// CHECK: vrcpbf16 zmm2 {k7}, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0xd3]
- vrcppbf16 zmm2 {k7}, zmm3
+ vrcpbf16 zmm2 {k7}, zmm3
-// CHECK: vrcppbf16 zmm2 {k7} {z}, zmm3
+// CHECK: vrcpbf16 zmm2 {k7} {z}, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0xd3]
- vrcppbf16 zmm2 {k7} {z}, zmm3
+ vrcpbf16 zmm2 {k7} {z}, zmm3
-// CHECK: vrcppbf16 ymm2, ymm3
+// CHECK: vrcpbf16 ymm2, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0xd3]
- vrcppbf16 ymm2, ymm3
+ vrcpbf16 ymm2, ymm3
-// CHECK: vrcppbf16 ymm2 {k7}, ymm3
+// CHECK: vrcpbf16 ymm2 {k7}, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0xd3]
- vrcppbf16 ymm2 {k7}, ymm3
+ vrcpbf16 ymm2 {k7}, ymm3
-// CHECK: vrcppbf16 ymm2 {k7} {z}, ymm3
+// CHECK: vrcpbf16 ymm2 {k7} {z}, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0xd3]
- vrcppbf16 ymm2 {k7} {z}, ymm3
+ vrcpbf16 ymm2 {k7} {z}, ymm3
-// CHECK: vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+ vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+ vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vrcppbf16 xmm2, word ptr [eax]{1to8}
+// CHECK: vrcpbf16 xmm2, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4c,0x10]
- vrcppbf16 xmm2, word ptr [eax]{1to8}
+ vrcpbf16 xmm2, word ptr [eax]{1to8}
-// CHECK: vrcppbf16 xmm2, xmmword ptr [2*ebp - 512]
+// CHECK: vrcpbf16 xmm2, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vrcppbf16 xmm2, xmmword ptr [2*ebp - 512]
+ vrcpbf16 xmm2, xmmword ptr [2*ebp - 512]
-// CHECK: vrcppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+// CHECK: vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f]
- vrcppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+ vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
-// CHECK: vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+// CHECK: vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80]
- vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+ vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
-// CHECK: vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+ vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+ vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vrcppbf16 ymm2, word ptr [eax]{1to16}
+// CHECK: vrcpbf16 ymm2, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4c,0x10]
- vrcppbf16 ymm2, word ptr [eax]{1to16}
+ vrcpbf16 ymm2, word ptr [eax]{1to16}
-// CHECK: vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+// CHECK: vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024]
+ vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024]
-// CHECK: vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+// CHECK: vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f]
- vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+ vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
-// CHECK: vrcppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+// CHECK: vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80]
- vrcppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+ vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
-// CHECK: vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+ vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00]
- vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+ vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vrcppbf16 zmm2, word ptr [eax]{1to32}
+// CHECK: vrcpbf16 zmm2, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4c,0x10]
- vrcppbf16 zmm2, word ptr [eax]{1to32}
+ vrcpbf16 zmm2, word ptr [eax]{1to32}
-// CHECK: vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+// CHECK: vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048]
+ vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048]
-// CHECK: vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+// CHECK: vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f]
- vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+ vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
-// CHECK: vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+// CHECK: vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80]
- vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+ vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
-// CHECK: vreducenepbf16 zmm2, zmm3, 123
+// CHECK: vreducebf16 zmm2, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b]
- vreducenepbf16 zmm2, zmm3, 123
+ vreducebf16 zmm2, zmm3, 123
-// CHECK: vreducenepbf16 zmm2 {k7}, zmm3, 123
+// CHECK: vreducebf16 zmm2 {k7}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b]
- vreducenepbf16 zmm2 {k7}, zmm3, 123
+ vreducebf16 zmm2 {k7}, zmm3, 123
-// CHECK: vreducenepbf16 zmm2 {k7} {z}, zmm3, 123
+// CHECK: vreducebf16 zmm2 {k7} {z}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b]
- vreducenepbf16 zmm2 {k7} {z}, zmm3, 123
+ vreducebf16 zmm2 {k7} {z}, zmm3, 123
-// CHECK: vreducenepbf16 ymm2, ymm3, 123
+// CHECK: vreducebf16 ymm2, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b]
- vreducenepbf16 ymm2, ymm3, 123
+ vreducebf16 ymm2, ymm3, 123
-// CHECK: vreducenepbf16 ymm2 {k7}, ymm3, 123
+// CHECK: vreducebf16 ymm2 {k7}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b]
- vreducenepbf16 ymm2 {k7}, ymm3, 123
+ vreducebf16 ymm2 {k7}, ymm3, 123
-// CHECK: vreducenepbf16 ymm2 {k7} {z}, ymm3, 123
+// CHECK: vreducebf16 ymm2 {k7} {z}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b]
- vreducenepbf16 ymm2 {k7} {z}, ymm3, 123
+ vreducebf16 ymm2 {k7} {z}, ymm3, 123
-// CHECK: vreducenepbf16 xmm2, xmm3, 123
+// CHECK: vreducebf16 xmm2, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b]
- vreducenepbf16 xmm2, xmm3, 123
+ vreducebf16 xmm2, xmm3, 123
-// CHECK: vreducenepbf16 xmm2 {k7}, xmm3, 123
+// CHECK: vreducebf16 xmm2 {k7}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b]
- vreducenepbf16 xmm2 {k7}, xmm3, 123
+ vreducebf16 xmm2 {k7}, xmm3, 123
-// CHECK: vreducenepbf16 xmm2 {k7} {z}, xmm3, 123
+// CHECK: vreducebf16 xmm2 {k7} {z}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b]
- vreducenepbf16 xmm2 {k7} {z}, xmm3, 123
+ vreducebf16 xmm2 {k7} {z}, xmm3, 123
-// CHECK: vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+ vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+ vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123
+// CHECK: vreducebf16 xmm2, word ptr [eax]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b]
- vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123
+ vreducebf16 xmm2, word ptr [eax]{1to8}, 123
-// CHECK: vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+// CHECK: vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+ vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123
-// CHECK: vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+// CHECK: vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+ vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
-// CHECK: vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+// CHECK: vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b]
- vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+ vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
-// CHECK: vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+ vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+// CHECK: vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+ vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
-// CHECK: vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123
+// CHECK: vreducebf16 ymm2, word ptr [eax]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b]
- vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123
+ vreducebf16 ymm2, word ptr [eax]{1to16}, 123
-// CHECK: vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+// CHECK: vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+ vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
-// CHECK: vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+// CHECK: vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+ vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
-// CHECK: vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+// CHECK: vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b]
- vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+ vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
-// CHECK: vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+ vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+ vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123
+// CHECK: vreducebf16 zmm2, word ptr [eax]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b]
- vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123
+ vreducebf16 zmm2, word ptr [eax]{1to32}, 123
-// CHECK: vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+// CHECK: vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+ vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
-// CHECK: vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+// CHECK: vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b]
- vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+ vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
-// CHECK: vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+// CHECK: vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b]
- vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+ vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
-// CHECK: vrndscalenepbf16 zmm2, zmm3, 123
+// CHECK: vrndscalebf16 zmm2, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b]
- vrndscalenepbf16 zmm2, zmm3, 123
+ vrndscalebf16 zmm2, zmm3, 123
-// CHECK: vrndscalenepbf16 zmm2 {k7}, zmm3, 123
+// CHECK: vrndscalebf16 zmm2 {k7}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b]
- vrndscalenepbf16 zmm2 {k7}, zmm3, 123
+ vrndscalebf16 zmm2 {k7}, zmm3, 123
-// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123
+// CHECK: vrndscalebf16 zmm2 {k7} {z}, zmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b]
- vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123
+ vrndscalebf16 zmm2 {k7} {z}, zmm3, 123
-// CHECK: vrndscalenepbf16 ymm2, ymm3, 123
+// CHECK: vrndscalebf16 ymm2, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b]
- vrndscalenepbf16 ymm2, ymm3, 123
+ vrndscalebf16 ymm2, ymm3, 123
-// CHECK: vrndscalenepbf16 ymm2 {k7}, ymm3, 123
+// CHECK: vrndscalebf16 ymm2 {k7}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b]
- vrndscalenepbf16 ymm2 {k7}, ymm3, 123
+ vrndscalebf16 ymm2 {k7}, ymm3, 123
-// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123
+// CHECK: vrndscalebf16 ymm2 {k7} {z}, ymm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b]
- vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123
+ vrndscalebf16 ymm2 {k7} {z}, ymm3, 123
-// CHECK: vrndscalenepbf16 xmm2, xmm3, 123
+// CHECK: vrndscalebf16 xmm2, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b]
- vrndscalenepbf16 xmm2, xmm3, 123
+ vrndscalebf16 xmm2, xmm3, 123
-// CHECK: vrndscalenepbf16 xmm2 {k7}, xmm3, 123
+// CHECK: vrndscalebf16 xmm2 {k7}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b]
- vrndscalenepbf16 xmm2 {k7}, xmm3, 123
+ vrndscalebf16 xmm2 {k7}, xmm3, 123
-// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123
+// CHECK: vrndscalebf16 xmm2 {k7} {z}, xmm3, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b]
- vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123
+ vrndscalebf16 xmm2 {k7} {z}, xmm3, 123
-// CHECK: vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
+ vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
+ vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123
+// CHECK: vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b]
- vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123
+ vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123
-// CHECK: vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+// CHECK: vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123
+ vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123
-// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+// CHECK: vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
+ vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
-// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+// CHECK: vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
+ vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
-// CHECK: vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
+ vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+// CHECK: vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
+ vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
-// CHECK: vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123
+// CHECK: vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b]
- vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123
+ vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123
-// CHECK: vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+// CHECK: vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
+ vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
-// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+// CHECK: vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
+ vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
-// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+// CHECK: vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
+ vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
-// CHECK: vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+// CHECK: vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
+ vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
-// CHECK: vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+// CHECK: vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
+ vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
-// CHECK: vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123
+// CHECK: vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b]
- vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123
+ vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123
-// CHECK: vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+// CHECK: vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
+ vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
-// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+// CHECK: vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b]
- vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
+ vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
-// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+// CHECK: vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b]
- vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
+ vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
-// CHECK: vrsqrtpbf16 xmm2, xmm3
+// CHECK: vrsqrtbf16 xmm2, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xd3]
- vrsqrtpbf16 xmm2, xmm3
+ vrsqrtbf16 xmm2, xmm3
-// CHECK: vrsqrtpbf16 xmm2 {k7}, xmm3
+// CHECK: vrsqrtbf16 xmm2 {k7}, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0xd3]
- vrsqrtpbf16 xmm2 {k7}, xmm3
+ vrsqrtbf16 xmm2 {k7}, xmm3
-// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, xmm3
+// CHECK: vrsqrtbf16 xmm2 {k7} {z}, xmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0xd3]
- vrsqrtpbf16 xmm2 {k7} {z}, xmm3
+ vrsqrtbf16 xmm2 {k7} {z}, xmm3
-// CHECK: vrsqrtpbf16 zmm2, zmm3
+// CHECK: vrsqrtbf16 zmm2, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xd3]
- vrsqrtpbf16 zmm2, zmm3
+ vrsqrtbf16 zmm2, zmm3
-// CHECK: vrsqrtpbf16 zmm2 {k7}, zmm3
+// CHECK: vrsqrtbf16 zmm2 {k7}, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0xd3]
- vrsqrtpbf16 zmm2 {k7}, zmm3
+ vrsqrtbf16 zmm2 {k7}, zmm3
-// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, zmm3
+// CHECK: vrsqrtbf16 zmm2 {k7} {z}, zmm3
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0xd3]
- vrsqrtpbf16 zmm2 {k7} {z}, zmm3
+ vrsqrtbf16 zmm2 {k7} {z}, zmm3
-// CHECK: vrsqrtpbf16 ymm2, ymm3
+// CHECK: vrsqrtbf16 ymm2, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xd3]
- vrsqrtpbf16 ymm2, ymm3
+ vrsqrtbf16 ymm2, ymm3
-// CHECK: vrsqrtpbf16 ymm2 {k7}, ymm3
+// CHECK: vrsqrtbf16 ymm2 {k7}, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0xd3]
- vrsqrtpbf16 ymm2 {k7}, ymm3
+ vrsqrtbf16 ymm2 {k7}, ymm3
-// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, ymm3
+// CHECK: vrsqrtbf16 ymm2 {k7} {z}, ymm3
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0xd3]
- vrsqrtpbf16 ymm2 {k7} {z}, ymm3
+ vrsqrtbf16 ymm2 {k7} {z}, ymm3
-// CHECK: vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+ vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+ vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vrsqrtpbf16 xmm2, word ptr [eax]{1to8}
+// CHECK: vrsqrtbf16 xmm2, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4e,0x10]
- vrsqrtpbf16 xmm2, word ptr [eax]{1to8}
+ vrsqrtbf16 xmm2, word ptr [eax]{1to8}
-// CHECK: vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512]
+// CHECK: vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512]
+ vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
-// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+// CHECK: vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f]
- vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+ vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
-// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+// CHECK: vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80]
- vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+ vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
-// CHECK: vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+ vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+ vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vrsqrtpbf16 ymm2, word ptr [eax]{1to16}
+// CHECK: vrsqrtbf16 ymm2, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4e,0x10]
- vrsqrtpbf16 ymm2, word ptr [eax]{1to16}
+ vrsqrtbf16 ymm2, word ptr [eax]{1to16}
-// CHECK: vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024]
+// CHECK: vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024]
+ vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
-// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+// CHECK: vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f]
- vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+ vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
-// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+// CHECK: vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80]
- vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+ vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
-// CHECK: vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+ vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+ vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vrsqrtpbf16 zmm2, word ptr [eax]{1to32}
+// CHECK: vrsqrtbf16 zmm2, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4e,0x10]
- vrsqrtpbf16 zmm2, word ptr [eax]{1to32}
+ vrsqrtbf16 zmm2, word ptr [eax]{1to32}
-// CHECK: vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048]
+// CHECK: vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048]
+ vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
-// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+// CHECK: vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f]
- vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+ vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
-// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+// CHECK: vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80]
- vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+ vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
-// CHECK: vscalefpbf16 ymm2, ymm3, ymm4
+// CHECK: vscalefbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0xd4]
- vscalefpbf16 ymm2, ymm3, ymm4
+ vscalefbf16 ymm2, ymm3, ymm4
-// CHECK: vscalefpbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vscalefbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0xd4]
- vscalefpbf16 ymm2 {k7}, ymm3, ymm4
+ vscalefbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0xd4]
- vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vscalefpbf16 zmm2, zmm3, zmm4
+// CHECK: vscalefbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0xd4]
- vscalefpbf16 zmm2, zmm3, zmm4
+ vscalefbf16 zmm2, zmm3, zmm4
-// CHECK: vscalefpbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vscalefbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0xd4]
- vscalefpbf16 zmm2 {k7}, zmm3, zmm4
+ vscalefbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0xd4]
- vscalefpbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vscalefpbf16 xmm2, xmm3, xmm4
+// CHECK: vscalefbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0xd4]
- vscalefpbf16 xmm2, xmm3, xmm4
+ vscalefbf16 xmm2, xmm3, xmm4
-// CHECK: vscalefpbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vscalefbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0xd4]
- vscalefpbf16 xmm2 {k7}, xmm3, xmm4
+ vscalefbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0xd4]
- vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0x58,0x2c,0x10]
- vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f]
- vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80]
- vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0x38,0x2c,0x10]
- vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f]
- vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80]
- vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00]
- vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x18,0x2c,0x10]
- vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f]
- vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80]
- vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
-// CHECK: vsqrtnepbf16 xmm2, xmm3
+// CHECK: vsqrtbf16 xmm2, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0xd3]
- vsqrtnepbf16 xmm2, xmm3
+ vsqrtbf16 xmm2, xmm3
-// CHECK: vsqrtnepbf16 xmm2 {k7}, xmm3
+// CHECK: vsqrtbf16 xmm2 {k7}, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0xd3]
- vsqrtnepbf16 xmm2 {k7}, xmm3
+ vsqrtbf16 xmm2 {k7}, xmm3
-// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, xmm3
+// CHECK: vsqrtbf16 xmm2 {k7} {z}, xmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0xd3]
- vsqrtnepbf16 xmm2 {k7} {z}, xmm3
+ vsqrtbf16 xmm2 {k7} {z}, xmm3
-// CHECK: vsqrtnepbf16 zmm2, zmm3
+// CHECK: vsqrtbf16 zmm2, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0xd3]
- vsqrtnepbf16 zmm2, zmm3
+ vsqrtbf16 zmm2, zmm3
-// CHECK: vsqrtnepbf16 zmm2 {k7}, zmm3
+// CHECK: vsqrtbf16 zmm2 {k7}, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0xd3]
- vsqrtnepbf16 zmm2 {k7}, zmm3
+ vsqrtbf16 zmm2 {k7}, zmm3
-// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, zmm3
+// CHECK: vsqrtbf16 zmm2 {k7} {z}, zmm3
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0xd3]
- vsqrtnepbf16 zmm2 {k7} {z}, zmm3
+ vsqrtbf16 zmm2 {k7} {z}, zmm3
-// CHECK: vsqrtnepbf16 ymm2, ymm3
+// CHECK: vsqrtbf16 ymm2, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0xd3]
- vsqrtnepbf16 ymm2, ymm3
+ vsqrtbf16 ymm2, ymm3
-// CHECK: vsqrtnepbf16 ymm2 {k7}, ymm3
+// CHECK: vsqrtbf16 ymm2 {k7}, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0xd3]
- vsqrtnepbf16 ymm2 {k7}, ymm3
+ vsqrtbf16 ymm2 {k7}, ymm3
-// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, ymm3
+// CHECK: vsqrtbf16 ymm2 {k7} {z}, ymm3
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0xd3]
- vsqrtnepbf16 ymm2 {k7} {z}, ymm3
+ vsqrtbf16 ymm2 {k7} {z}, ymm3
-// CHECK: vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
+ vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
+ vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vsqrtnepbf16 xmm2, word ptr [eax]{1to8}
+// CHECK: vsqrtbf16 xmm2, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x51,0x10]
- vsqrtnepbf16 xmm2, word ptr [eax]{1to8}
+ vsqrtbf16 xmm2, word ptr [eax]{1to8}
-// CHECK: vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512]
+// CHECK: vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512]
+ vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
-// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+// CHECK: vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f]
- vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
+ vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
-// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+// CHECK: vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80]
- vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
+ vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
-// CHECK: vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
+ vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
+ vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vsqrtnepbf16 ymm2, word ptr [eax]{1to16}
+// CHECK: vsqrtbf16 ymm2, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x51,0x10]
- vsqrtnepbf16 ymm2, word ptr [eax]{1to16}
+ vsqrtbf16 ymm2, word ptr [eax]{1to16}
-// CHECK: vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024]
+// CHECK: vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024]
+ vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
-// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+// CHECK: vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f]
- vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
+ vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
-// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+// CHECK: vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80]
- vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
+ vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
-// CHECK: vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
+ vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
+ vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vsqrtnepbf16 zmm2, word ptr [eax]{1to32}
+// CHECK: vsqrtbf16 zmm2, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x51,0x10]
- vsqrtnepbf16 zmm2, word ptr [eax]{1to32}
+ vsqrtbf16 zmm2, word ptr [eax]{1to32}
-// CHECK: vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048]
+// CHECK: vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048]
+ vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
-// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+// CHECK: vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f]
- vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
+ vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
-// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+// CHECK: vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80]
- vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
+ vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
-// CHECK: vsubnepbf16 ymm2, ymm3, ymm4
+// CHECK: vsubbf16 ymm2, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0xd4]
- vsubnepbf16 ymm2, ymm3, ymm4
+ vsubbf16 ymm2, ymm3, ymm4
-// CHECK: vsubnepbf16 ymm2 {k7}, ymm3, ymm4
+// CHECK: vsubbf16 ymm2 {k7}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0xd4]
- vsubnepbf16 ymm2 {k7}, ymm3, ymm4
+ vsubbf16 ymm2 {k7}, ymm3, ymm4
-// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, ymm4
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0xd4]
- vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4
+ vsubbf16 ymm2 {k7} {z}, ymm3, ymm4
-// CHECK: vsubnepbf16 zmm2, zmm3, zmm4
+// CHECK: vsubbf16 zmm2, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0xd4]
- vsubnepbf16 zmm2, zmm3, zmm4
+ vsubbf16 zmm2, zmm3, zmm4
-// CHECK: vsubnepbf16 zmm2 {k7}, zmm3, zmm4
+// CHECK: vsubbf16 zmm2 {k7}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0xd4]
- vsubnepbf16 zmm2 {k7}, zmm3, zmm4
+ vsubbf16 zmm2 {k7}, zmm3, zmm4
-// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, zmm4
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0xd4]
- vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4
+ vsubbf16 zmm2 {k7} {z}, zmm3, zmm4
-// CHECK: vsubnepbf16 xmm2, xmm3, xmm4
+// CHECK: vsubbf16 xmm2, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0xd4]
- vsubnepbf16 xmm2, xmm3, xmm4
+ vsubbf16 xmm2, xmm3, xmm4
-// CHECK: vsubnepbf16 xmm2 {k7}, xmm3, xmm4
+// CHECK: vsubbf16 xmm2 {k7}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0xd4]
- vsubnepbf16 xmm2 {k7}, xmm3, xmm4
+ vsubbf16 xmm2 {k7}, xmm3, xmm4
-// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, xmm4
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0xd4]
- vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4
+ vsubbf16 xmm2 {k7} {z}, xmm3, xmm4
-// CHECK: vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
+ vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+// CHECK: vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
+ vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
-// CHECK: vsubnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+// CHECK: vsubbf16 zmm2, zmm3, word ptr [eax]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5c,0x10]
- vsubnepbf16 zmm2, zmm3, word ptr [eax]{1to32}
+ vsubbf16 zmm2, zmm3, word ptr [eax]{1to32}
-// CHECK: vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+// CHECK: vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
// CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff]
- vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
+ vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
-// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
// CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f]
- vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
+ vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
-// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
// CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80]
- vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
+ vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
-// CHECK: vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
+ vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+// CHECK: vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
+ vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
-// CHECK: vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+// CHECK: vsubbf16 ymm2, ymm3, word ptr [eax]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5c,0x10]
- vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16}
+ vsubbf16 ymm2, ymm3, word ptr [eax]{1to16}
-// CHECK: vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+// CHECK: vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
// CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff]
- vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
+ vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
-// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f]
- vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
+ vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
-// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
// CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80]
- vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
+ vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
-// CHECK: vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+// CHECK: vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10]
- vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
+ vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
-// CHECK: vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+// CHECK: vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
// CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00]
- vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
+ vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
-// CHECK: vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+// CHECK: vsubbf16 xmm2, xmm3, word ptr [eax]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5c,0x10]
- vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8}
+ vsubbf16 xmm2, xmm3, word ptr [eax]{1to8}
-// CHECK: vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+// CHECK: vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
// CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff]
- vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
+ vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
-// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
// CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f]
- vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
+ vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
-// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
// CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80]
- vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
+ vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
diff --git a/llvm/test/MC/X86/avx10.2-bf16-64-att.s b/llvm/test/MC/X86/avx10.2-bf16-64-att.s
index 85d99cfe0a7043..d960dca940c80e 100644
--- a/llvm/test/MC/X86/avx10.2-bf16-64-att.s
+++ b/llvm/test/MC/X86/avx10.2-bf16-64-att.s
@@ -1,208 +1,208 @@
// RUN: llvm-mc -triple x86_64 --show-encoding %s | FileCheck %s
-// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x58,0xf0]
- vaddnepbf16 %ymm24, %ymm23, %ymm22
+ vaddbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x58,0xf0]
- vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vaddbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x58,0xf0]
- vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vaddbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x58,0xf0]
- vaddnepbf16 %zmm24, %zmm23, %zmm22
+ vaddbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x58,0xf0]
- vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vaddbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x58,0xf0]
- vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x58,0xf0]
- vaddnepbf16 %xmm24, %xmm23, %xmm22
+ vaddbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x58,0xf0]
- vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vaddbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x58,0xf0]
- vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vaddbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vaddbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f]
- vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x58,0x72,0x80]
- vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vaddbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vaddbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vaddbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vaddbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f]
- vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x58,0x72,0x80]
- vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vaddbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vaddbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vaddbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vaddbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x58,0x71,0x7f]
- vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x58,0x72,0x80]
- vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vcmppbf16 $123, %ymm24, %ymm23, %k5
+// CHECK: vcmpbf16 $123, %ymm24, %ymm23, %k5
// CHECK: encoding: [0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %ymm24, %ymm23, %k5
+ vcmpbf16 $123, %ymm24, %ymm23, %k5
-// CHECK: vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7}
// CHECK: encoding: [0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7}
+ vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, %xmm24, %xmm23, %k5
+// CHECK: vcmpbf16 $123, %xmm24, %xmm23, %k5
// CHECK: encoding: [0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %xmm24, %xmm23, %k5
+ vcmpbf16 $123, %xmm24, %xmm23, %k5
-// CHECK: vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7}
+ vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, %zmm24, %zmm23, %k5
+// CHECK: vcmpbf16 $123, %zmm24, %zmm23, %k5
// CHECK: encoding: [0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %zmm24, %zmm23, %k5
+ vcmpbf16 $123, %zmm24, %zmm23, %k5
-// CHECK: vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b]
- vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7}
+ vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
+// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
// CHECK: encoding: [0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
+ vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5
-// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
+ vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5
+// CHECK: vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5
+ vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5
-// CHECK: vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5
+// CHECK: vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5
+ vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5
-// CHECK: vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
+ vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
+ vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
+// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
// CHECK: encoding: [0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
+ vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5
-// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
+ vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5
+// CHECK: vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5
+ vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5
-// CHECK: vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5
+// CHECK: vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5
+ vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5
-// CHECK: vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
+ vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
+ vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
+// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
// CHECK: encoding: [0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
+ vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5
-// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
+ vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, (%rip){1to16}, %ymm23, %k5
+// CHECK: vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 $123, (%rip){1to16}, %ymm23, %k5
+ vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5
-// CHECK: vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5
+// CHECK: vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5
// CHECK: encoding: [0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5
+ vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5
-// CHECK: vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
+ vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7}
-// CHECK: vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
+// CHECK: vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
+ vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7}
// CHECK: vcomsbf16 %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x2f,0xf7]
@@ -232,2783 +232,2783 @@
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80]
vcomsbf16 -256(%rdx), %xmm22
-// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5e,0xf0]
- vdivnepbf16 %ymm24, %ymm23, %ymm22
+ vdivbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5e,0xf0]
- vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vdivbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5e,0xf0]
- vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5e,0xf0]
- vdivnepbf16 %zmm24, %zmm23, %zmm22
+ vdivbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5e,0xf0]
- vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vdivbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5e,0xf0]
- vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5e,0xf0]
- vdivnepbf16 %xmm24, %xmm23, %xmm22
+ vdivbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5e,0xf0]
- vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vdivbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5e,0xf0]
- vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vdivbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vdivbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f]
- vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80]
- vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vdivbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vdivbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vdivnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vdivnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f]
- vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80]
- vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vdivbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vdivbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vdivbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vdivbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f]
- vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5e,0x72,0x80]
- vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x98,0xf0]
- vfmadd132nepbf16 %ymm24, %ymm23, %ymm22
+ vfmadd132bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x98,0xf0]
- vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x98,0xf0]
- vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x98,0xf0]
- vfmadd132nepbf16 %zmm24, %zmm23, %zmm22
+ vfmadd132bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x98,0xf0]
- vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x98,0xf0]
- vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x98,0xf0]
- vfmadd132nepbf16 %xmm24, %xmm23, %xmm22
+ vfmadd132bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x98,0xf0]
- vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x98,0xf0]
- vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f]
- vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x98,0x72,0x80]
- vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f]
- vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x98,0x72,0x80]
- vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x98,0x71,0x7f]
- vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x98,0x72,0x80]
- vfmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xa8,0xf0]
- vfmadd213nepbf16 %ymm24, %ymm23, %ymm22
+ vfmadd213bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xa8,0xf0]
- vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xa8,0xf0]
- vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xa8,0xf0]
- vfmadd213nepbf16 %zmm24, %zmm23, %zmm22
+ vfmadd213bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xa8,0xf0]
- vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xa8,0xf0]
- vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xa8,0xf0]
- vfmadd213nepbf16 %xmm24, %xmm23, %xmm22
+ vfmadd213bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xa8,0xf0]
- vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xa8,0xf0]
- vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f]
- vfmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80]
- vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f]
- vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80]
- vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f]
- vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xa8,0x72,0x80]
- vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xb8,0xf0]
- vfmadd231nepbf16 %ymm24, %ymm23, %ymm22
+ vfmadd231bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xb8,0xf0]
- vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xb8,0xf0]
- vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xb8,0xf0]
- vfmadd231nepbf16 %zmm24, %zmm23, %zmm22
+ vfmadd231bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xb8,0xf0]
- vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xb8,0xf0]
- vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xb8,0xf0]
- vfmadd231nepbf16 %xmm24, %xmm23, %xmm22
+ vfmadd231bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xb8,0xf0]
- vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xb8,0xf0]
- vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f]
- vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80]
- vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f]
- vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80]
- vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f]
- vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xb8,0x72,0x80]
- vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9a,0xf0]
- vfmsub132nepbf16 %ymm24, %ymm23, %ymm22
+ vfmsub132bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9a,0xf0]
- vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9a,0xf0]
- vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9a,0xf0]
- vfmsub132nepbf16 %zmm24, %zmm23, %zmm22
+ vfmsub132bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9a,0xf0]
- vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9a,0xf0]
- vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9a,0xf0]
- vfmsub132nepbf16 %xmm24, %xmm23, %xmm22
+ vfmsub132bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9a,0xf0]
- vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9a,0xf0]
- vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f]
- vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80]
- vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f]
- vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80]
- vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f]
- vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9a,0x72,0x80]
- vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xaa,0xf0]
- vfmsub213nepbf16 %ymm24, %ymm23, %ymm22
+ vfmsub213bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xaa,0xf0]
- vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xaa,0xf0]
- vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xaa,0xf0]
- vfmsub213nepbf16 %zmm24, %zmm23, %zmm22
+ vfmsub213bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xaa,0xf0]
- vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xaa,0xf0]
- vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xaa,0xf0]
- vfmsub213nepbf16 %xmm24, %xmm23, %xmm22
+ vfmsub213bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xaa,0xf0]
- vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xaa,0xf0]
- vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f]
- vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80]
- vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f]
- vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80]
- vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f]
- vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xaa,0x72,0x80]
- vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xba,0xf0]
- vfmsub231nepbf16 %ymm24, %ymm23, %ymm22
+ vfmsub231bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xba,0xf0]
- vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xba,0xf0]
- vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xba,0xf0]
- vfmsub231nepbf16 %zmm24, %zmm23, %zmm22
+ vfmsub231bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xba,0xf0]
- vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xba,0xf0]
- vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xba,0xf0]
- vfmsub231nepbf16 %xmm24, %xmm23, %xmm22
+ vfmsub231bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xba,0xf0]
- vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xba,0xf0]
- vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f]
- vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xba,0x72,0x80]
- vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f]
- vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xba,0x72,0x80]
- vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xba,0x71,0x7f]
- vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xba,0x72,0x80]
- vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9c,0xf0]
- vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmadd132bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9c,0xf0]
- vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9c,0xf0]
- vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9c,0xf0]
- vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmadd132bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9c,0xf0]
- vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9c,0xf0]
- vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9c,0xf0]
- vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmadd132bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9c,0xf0]
- vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9c,0xf0]
- vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmadd132bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80]
- vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80]
- vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9c,0x72,0x80]
- vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xac,0xf0]
- vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmadd213bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xac,0xf0]
- vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xac,0xf0]
- vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xac,0xf0]
- vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmadd213bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xac,0xf0]
- vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xac,0xf0]
- vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xac,0xf0]
- vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmadd213bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xac,0xf0]
- vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xac,0xf0]
- vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f]
- vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xac,0x72,0x80]
- vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f]
- vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xac,0x72,0x80]
- vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xac,0x71,0x7f]
- vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xac,0x72,0x80]
- vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xbc,0xf0]
- vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmadd231bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xbc,0xf0]
- vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbc,0xf0]
- vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xbc,0xf0]
- vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmadd231bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xbc,0xf0]
- vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbc,0xf0]
- vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xbc,0xf0]
- vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmadd231bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xbc,0xf0]
- vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xbc,0xf0]
- vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80]
- vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80]
- vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbc,0x72,0x80]
- vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9e,0xf0]
- vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmsub132bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9e,0xf0]
- vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9e,0xf0]
- vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9e,0xf0]
- vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmsub132bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9e,0xf0]
- vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9e,0xf0]
- vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9e,0xf0]
- vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmsub132bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9e,0xf0]
- vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9e,0xf0]
- vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmsub132bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80]
- vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80]
- vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9e,0x72,0x80]
- vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xae,0xf0]
- vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmsub213bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xae,0xf0]
- vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xae,0xf0]
- vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmsub213bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xae,0xf0]
- vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmsub213bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xae,0xf0]
- vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xae,0xf0]
- vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xae,0xf0]
- vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmsub213bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xae,0xf0]
- vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xae,0xf0]
- vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f]
- vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xae,0x72,0x80]
- vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f]
- vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xae,0x72,0x80]
- vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xae,0x71,0x7f]
- vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xae,0x72,0x80]
- vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xbe,0xf0]
- vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22
+ vfnmsub231bf16 %ymm24, %ymm23, %ymm22
-// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xbe,0xf0]
- vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbe,0xf0]
- vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xbe,0xf0]
- vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22
+ vfnmsub231bf16 %zmm24, %zmm23, %zmm22
-// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xbe,0xf0]
- vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbe,0xf0]
- vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xbe,0xf0]
- vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22
+ vfnmsub231bf16 %xmm24, %xmm23, %xmm22
-// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xbe,0xf0]
- vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xbe,0xf0]
- vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vfnmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vfnmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80]
- vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80]
- vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vfnmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vfnmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbe,0x72,0x80]
- vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vfpclasspbf16 $123, %zmm23, %k5
+// CHECK: vfpclassbf16 $123, %zmm23, %k5
// CHECK: encoding: [0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %zmm23, %k5
+ vfpclassbf16 $123, %zmm23, %k5
-// CHECK: vfpclasspbf16 $123, %zmm23, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %zmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %zmm23, %k5 {%k7}
+ vfpclassbf16 $123, %zmm23, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, %ymm23, %k5
+// CHECK: vfpclassbf16 $123, %ymm23, %k5
// CHECK: encoding: [0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %ymm23, %k5
+ vfpclassbf16 $123, %ymm23, %k5
-// CHECK: vfpclasspbf16 $123, %ymm23, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %ymm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %ymm23, %k5 {%k7}
+ vfpclassbf16 $123, %ymm23, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, %xmm23, %k5
+// CHECK: vfpclassbf16 $123, %xmm23, %k5
// CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %xmm23, %k5
+ vfpclassbf16 $123, %xmm23, %k5
-// CHECK: vfpclasspbf16 $123, %xmm23, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, %xmm23, %k5 {%k7}
// CHECK: encoding: [0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b]
- vfpclasspbf16 $123, %xmm23, %k5 {%k7}
+ vfpclassbf16 $123, %xmm23, %k5 {%k7}
-// CHECK: vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5
+// CHECK: vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5
// CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5
+ vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5
-// CHECK: vfpclasspbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
+// CHECK: vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
// CHECK: encoding: [0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vfpclasspbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
+ vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%rip){1to8}, %k5
+// CHECK: vfpclassbf16 $123, (%rip){1to8}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 $123, (%rip){1to8}, %k5
+ vfpclassbf16 $123, (%rip){1to8}, %k5
-// CHECK: vfpclasspbf16x $123, -512(,%rbp,2), %k5
+// CHECK: vfpclassbf16x $123, -512(,%rbp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vfpclasspbf16x $123, -512(,%rbp,2), %k5
+ vfpclassbf16x $123, -512(,%rbp,2), %k5
-// CHECK: vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7}
+// CHECK: vfpclassbf16x $123, 2032(%rcx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7}
+ vfpclassbf16x $123, 2032(%rcx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%rip){1to16}, %k5
+// CHECK: vfpclassbf16 $123, (%rip){1to16}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 $123, (%rip){1to16}, %k5
+ vfpclassbf16 $123, (%rip){1to16}, %k5
-// CHECK: vfpclasspbf16y $123, -1024(,%rbp,2), %k5
+// CHECK: vfpclassbf16y $123, -1024(,%rbp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vfpclasspbf16y $123, -1024(,%rbp,2), %k5
+ vfpclassbf16y $123, -1024(,%rbp,2), %k5
-// CHECK: vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7}
+// CHECK: vfpclassbf16y $123, 4064(%rcx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7}
+ vfpclassbf16y $123, 4064(%rcx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, (%rip){1to32}, %k5
+// CHECK: vfpclassbf16 $123, (%rip){1to32}, %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 $123, (%rip){1to32}, %k5
+ vfpclassbf16 $123, (%rip){1to32}, %k5
-// CHECK: vfpclasspbf16z $123, -2048(,%rbp,2), %k5
+// CHECK: vfpclassbf16z $123, -2048(,%rbp,2), %k5
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vfpclasspbf16z $123, -2048(,%rbp,2), %k5
+ vfpclassbf16z $123, -2048(,%rbp,2), %k5
-// CHECK: vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7}
+// CHECK: vfpclassbf16z $123, 8128(%rcx), %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7}
+ vfpclassbf16z $123, 8128(%rcx), %k5 {%k7}
-// CHECK: vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
+// CHECK: vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
// CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
+ vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7}
-// CHECK: vgetexppbf16 %xmm23, %xmm22
+// CHECK: vgetexpbf16 %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xf7]
- vgetexppbf16 %xmm23, %xmm22
+ vgetexpbf16 %xmm23, %xmm22
-// CHECK: vgetexppbf16 %xmm23, %xmm22 {%k7}
+// CHECK: vgetexpbf16 %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x42,0xf7]
- vgetexppbf16 %xmm23, %xmm22 {%k7}
+ vgetexpbf16 %xmm23, %xmm22 {%k7}
-// CHECK: vgetexppbf16 %xmm23, %xmm22 {%k7} {z}
+// CHECK: vgetexpbf16 %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x42,0xf7]
- vgetexppbf16 %xmm23, %xmm22 {%k7} {z}
+ vgetexpbf16 %xmm23, %xmm22 {%k7} {z}
-// CHECK: vgetexppbf16 %zmm23, %zmm22
+// CHECK: vgetexpbf16 %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xf7]
- vgetexppbf16 %zmm23, %zmm22
+ vgetexpbf16 %zmm23, %zmm22
-// CHECK: vgetexppbf16 %zmm23, %zmm22 {%k7}
+// CHECK: vgetexpbf16 %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x42,0xf7]
- vgetexppbf16 %zmm23, %zmm22 {%k7}
+ vgetexpbf16 %zmm23, %zmm22 {%k7}
-// CHECK: vgetexppbf16 %zmm23, %zmm22 {%k7} {z}
+// CHECK: vgetexpbf16 %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x42,0xf7]
- vgetexppbf16 %zmm23, %zmm22 {%k7} {z}
+ vgetexpbf16 %zmm23, %zmm22 {%k7} {z}
-// CHECK: vgetexppbf16 %ymm23, %ymm22
+// CHECK: vgetexpbf16 %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xf7]
- vgetexppbf16 %ymm23, %ymm22
+ vgetexpbf16 %ymm23, %ymm22
-// CHECK: vgetexppbf16 %ymm23, %ymm22 {%k7}
+// CHECK: vgetexpbf16 %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x42,0xf7]
- vgetexppbf16 %ymm23, %ymm22 {%k7}
+ vgetexpbf16 %ymm23, %ymm22 {%k7}
-// CHECK: vgetexppbf16 %ymm23, %ymm22 {%k7} {z}
+// CHECK: vgetexpbf16 %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x42,0xf7]
- vgetexppbf16 %ymm23, %ymm22 {%k7} {z}
+ vgetexpbf16 %ymm23, %ymm22 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%rbp,%r14,8), %xmm22
+ vgetexpbf16 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7}
+ vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vgetexppbf16 (%rip){1to8}, %xmm22
+// CHECK: vgetexpbf16 (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 (%rip){1to8}, %xmm22
+ vgetexpbf16 (%rip){1to8}, %xmm22
-// CHECK: vgetexppbf16 -512(,%rbp,2), %xmm22
+// CHECK: vgetexpbf16 -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vgetexppbf16 -512(,%rbp,2), %xmm22
+ vgetexpbf16 -512(,%rbp,2), %xmm22
-// CHECK: vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f]
- vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z}
+ vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80]
- vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%rbp,%r14,8), %ymm22
+ vgetexpbf16 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7}
+ vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vgetexppbf16 (%rip){1to16}, %ymm22
+// CHECK: vgetexpbf16 (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 (%rip){1to16}, %ymm22
+ vgetexpbf16 (%rip){1to16}, %ymm22
-// CHECK: vgetexppbf16 -1024(,%rbp,2), %ymm22
+// CHECK: vgetexpbf16 -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vgetexppbf16 -1024(,%rbp,2), %ymm22
+ vgetexpbf16 -1024(,%rbp,2), %ymm22
-// CHECK: vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f]
- vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z}
+ vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80]
- vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 268435456(%rbp,%r14,8), %zmm22
+ vgetexpbf16 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7}
+ vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vgetexppbf16 (%rip){1to32}, %zmm22
+// CHECK: vgetexpbf16 (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 (%rip){1to32}, %zmm22
+ vgetexpbf16 (%rip){1to32}, %zmm22
-// CHECK: vgetexppbf16 -2048(,%rbp,2), %zmm22
+// CHECK: vgetexpbf16 -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vgetexppbf16 -2048(,%rbp,2), %zmm22
+ vgetexpbf16 -2048(,%rbp,2), %zmm22
-// CHECK: vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f]
- vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z}
+ vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vgetexpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80]
- vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vgetexpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22
+// CHECK: vgetmantbf16 $123, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %zmm23, %zmm22
+ vgetmantbf16 $123, %zmm23, %zmm22
-// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7}
+// CHECK: vgetmantbf16 $123, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %zmm23, %zmm22 {%k7}
+ vgetmantbf16 $123, %zmm23, %zmm22 {%k7}
-// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z}
+ vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22
+// CHECK: vgetmantbf16 $123, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %ymm23, %ymm22
+ vgetmantbf16 $123, %ymm23, %ymm22
-// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7}
+// CHECK: vgetmantbf16 $123, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %ymm23, %ymm22 {%k7}
+ vgetmantbf16 $123, %ymm23, %ymm22 {%k7}
-// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z}
+ vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, %xmm23, %xmm22
+// CHECK: vgetmantbf16 $123, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %xmm23, %xmm22
+ vgetmantbf16 $123, %xmm23, %xmm22
-// CHECK: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7}
+// CHECK: vgetmantbf16 $123, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %xmm23, %xmm22 {%k7}
+ vgetmantbf16 $123, %xmm23, %xmm22 {%k7}
-// CHECK: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b]
- vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} {z}
+ vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+ vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+ vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vgetmantpbf16 $123, (%rip){1to8}, %xmm22
+// CHECK: vgetmantbf16 $123, (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 $123, (%rip){1to8}, %xmm22
+ vgetmantbf16 $123, (%rip){1to8}, %xmm22
-// CHECK: vgetmantpbf16 $123, -512(,%rbp,2), %xmm22
+// CHECK: vgetmantbf16 $123, -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -512(,%rbp,2), %xmm22
+ vgetmantbf16 $123, -512(,%rbp,2), %xmm22
-// CHECK: vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+ vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+ vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+ vgetmantbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vgetmantpbf16 $123, (%rip){1to16}, %ymm22
+// CHECK: vgetmantbf16 $123, (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 $123, (%rip){1to16}, %ymm22
+ vgetmantbf16 $123, (%rip){1to16}, %ymm22
-// CHECK: vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22
+// CHECK: vgetmantbf16 $123, -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22
+ vgetmantbf16 $123, -1024(,%rbp,2), %ymm22
-// CHECK: vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+ vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+ vgetmantbf16 $123, 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+ vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vgetmantpbf16 $123, (%rip){1to32}, %zmm22
+// CHECK: vgetmantbf16 $123, (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 $123, (%rip){1to32}, %zmm22
+ vgetmantbf16 $123, (%rip){1to32}, %zmm22
-// CHECK: vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22
+// CHECK: vgetmantbf16 $123, -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22
+ vgetmantbf16 $123, -2048(,%rbp,2), %zmm22
-// CHECK: vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+ vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vmaxbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5f,0xf0]
- vmaxpbf16 %ymm24, %ymm23, %ymm22
+ vmaxbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5f,0xf0]
- vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5f,0xf0]
- vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5f,0xf0]
- vmaxpbf16 %zmm24, %zmm23, %zmm22
+ vmaxbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5f,0xf0]
- vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5f,0xf0]
- vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5f,0xf0]
- vmaxpbf16 %xmm24, %xmm23, %xmm22
+ vmaxbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5f,0xf0]
- vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5f,0xf0]
- vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vmaxbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22
+ vmaxbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f]
- vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80]
- vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vmaxbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22
+ vmaxbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f]
- vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80]
- vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vmaxbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22
+ vmaxbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vmaxpbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vmaxpbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f]
- vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5f,0x72,0x80]
- vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vminbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5d,0xf0]
- vminpbf16 %ymm24, %ymm23, %ymm22
+ vminbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vminbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5d,0xf0]
- vminpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vminbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5d,0xf0]
- vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vminbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5d,0xf0]
- vminpbf16 %zmm24, %zmm23, %zmm22
+ vminbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vminbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5d,0xf0]
- vminpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vminbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5d,0xf0]
- vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vminbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vminbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5d,0xf0]
- vminpbf16 %xmm24, %xmm23, %xmm22
+ vminbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vminbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5d,0xf0]
- vminpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vminbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5d,0xf0]
- vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vminpbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vminbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 (%rip){1to32}, %zmm23, %zmm22
+ vminbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vminbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vminbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vminpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f]
- vminpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80]
- vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vminpbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vminbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 (%rip){1to16}, %ymm23, %ymm22
+ vminbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vminbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vminbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f]
- vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80]
- vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vminbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vminbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vminpbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vminbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 (%rip){1to8}, %xmm23, %xmm22
+ vminbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vminpbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vminbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vminpbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vminbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f]
- vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5d,0x72,0x80]
- vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vmulbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x59,0xf0]
- vmulnepbf16 %ymm24, %ymm23, %ymm22
+ vmulbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x59,0xf0]
- vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vmulbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x59,0xf0]
- vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x59,0xf0]
- vmulnepbf16 %zmm24, %zmm23, %zmm22
+ vmulbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x59,0xf0]
- vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vmulbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x59,0xf0]
- vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x59,0xf0]
- vmulnepbf16 %xmm24, %xmm23, %xmm22
+ vmulbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x59,0xf0]
- vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vmulbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x59,0xf0]
- vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vmulbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vmulbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f]
- vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x59,0x72,0x80]
- vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vmulbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vmulbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f]
- vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x59,0x72,0x80]
- vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vmulbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vmulbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vmulbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vmulbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x59,0x71,0x7f]
- vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x59,0x72,0x80]
- vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vrcppbf16 %xmm23, %xmm22
+// CHECK: vrcpbf16 %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xf7]
- vrcppbf16 %xmm23, %xmm22
+ vrcpbf16 %xmm23, %xmm22
-// CHECK: vrcppbf16 %xmm23, %xmm22 {%k7}
+// CHECK: vrcpbf16 %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4c,0xf7]
- vrcppbf16 %xmm23, %xmm22 {%k7}
+ vrcpbf16 %xmm23, %xmm22 {%k7}
-// CHECK: vrcppbf16 %xmm23, %xmm22 {%k7} {z}
+// CHECK: vrcpbf16 %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4c,0xf7]
- vrcppbf16 %xmm23, %xmm22 {%k7} {z}
+ vrcpbf16 %xmm23, %xmm22 {%k7} {z}
-// CHECK: vrcppbf16 %zmm23, %zmm22
+// CHECK: vrcpbf16 %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xf7]
- vrcppbf16 %zmm23, %zmm22
+ vrcpbf16 %zmm23, %zmm22
-// CHECK: vrcppbf16 %zmm23, %zmm22 {%k7}
+// CHECK: vrcpbf16 %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4c,0xf7]
- vrcppbf16 %zmm23, %zmm22 {%k7}
+ vrcpbf16 %zmm23, %zmm22 {%k7}
-// CHECK: vrcppbf16 %zmm23, %zmm22 {%k7} {z}
+// CHECK: vrcpbf16 %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4c,0xf7]
- vrcppbf16 %zmm23, %zmm22 {%k7} {z}
+ vrcpbf16 %zmm23, %zmm22 {%k7} {z}
-// CHECK: vrcppbf16 %ymm23, %ymm22
+// CHECK: vrcpbf16 %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xf7]
- vrcppbf16 %ymm23, %ymm22
+ vrcpbf16 %ymm23, %ymm22
-// CHECK: vrcppbf16 %ymm23, %ymm22 {%k7}
+// CHECK: vrcpbf16 %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4c,0xf7]
- vrcppbf16 %ymm23, %ymm22 {%k7}
+ vrcpbf16 %ymm23, %ymm22 {%k7}
-// CHECK: vrcppbf16 %ymm23, %ymm22 {%k7} {z}
+// CHECK: vrcpbf16 %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4c,0xf7]
- vrcppbf16 %ymm23, %ymm22 {%k7} {z}
+ vrcpbf16 %ymm23, %ymm22 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%rbp,%r14,8), %xmm22
+ vrcpbf16 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7}
+ vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vrcppbf16 (%rip){1to8}, %xmm22
+// CHECK: vrcpbf16 (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 (%rip){1to8}, %xmm22
+ vrcpbf16 (%rip){1to8}, %xmm22
-// CHECK: vrcppbf16 -512(,%rbp,2), %xmm22
+// CHECK: vrcpbf16 -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vrcppbf16 -512(,%rbp,2), %xmm22
+ vrcpbf16 -512(,%rbp,2), %xmm22
-// CHECK: vrcppbf16 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vrcpbf16 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f]
- vrcppbf16 2032(%rcx), %xmm22 {%k7} {z}
+ vrcpbf16 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vrcppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80]
- vrcppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%rbp,%r14,8), %ymm22
+ vrcpbf16 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7}
+ vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vrcppbf16 (%rip){1to16}, %ymm22
+// CHECK: vrcpbf16 (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 (%rip){1to16}, %ymm22
+ vrcpbf16 (%rip){1to16}, %ymm22
-// CHECK: vrcppbf16 -1024(,%rbp,2), %ymm22
+// CHECK: vrcpbf16 -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vrcppbf16 -1024(,%rbp,2), %ymm22
+ vrcpbf16 -1024(,%rbp,2), %ymm22
-// CHECK: vrcppbf16 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vrcpbf16 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f]
- vrcppbf16 4064(%rcx), %ymm22 {%k7} {z}
+ vrcpbf16 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80]
- vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 268435456(%rbp,%r14,8), %zmm22
+ vrcpbf16 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7}
+ vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vrcppbf16 (%rip){1to32}, %zmm22
+// CHECK: vrcpbf16 (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 (%rip){1to32}, %zmm22
+ vrcpbf16 (%rip){1to32}, %zmm22
-// CHECK: vrcppbf16 -2048(,%rbp,2), %zmm22
+// CHECK: vrcpbf16 -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vrcppbf16 -2048(,%rbp,2), %zmm22
+ vrcpbf16 -2048(,%rbp,2), %zmm22
-// CHECK: vrcppbf16 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vrcpbf16 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f]
- vrcppbf16 8128(%rcx), %zmm22 {%k7} {z}
+ vrcpbf16 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80]
- vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %zmm23, %zmm22
+// CHECK: vreducebf16 $123, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %zmm23, %zmm22
+ vreducebf16 $123, %zmm23, %zmm22
-// CHECK: vreducenepbf16 $123, %zmm23, %zmm22 {%k7}
+// CHECK: vreducebf16 $123, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %zmm23, %zmm22 {%k7}
+ vreducebf16 $123, %zmm23, %zmm22 {%k7}
-// CHECK: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
+ vreducebf16 $123, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %ymm23, %ymm22
+// CHECK: vreducebf16 $123, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %ymm23, %ymm22
+ vreducebf16 $123, %ymm23, %ymm22
-// CHECK: vreducenepbf16 $123, %ymm23, %ymm22 {%k7}
+// CHECK: vreducebf16 $123, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %ymm23, %ymm22 {%k7}
+ vreducebf16 $123, %ymm23, %ymm22 {%k7}
-// CHECK: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vreducebf16 $123, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
+ vreducebf16 $123, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, %xmm23, %xmm22
+// CHECK: vreducebf16 $123, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %xmm23, %xmm22
+ vreducebf16 $123, %xmm23, %xmm22
-// CHECK: vreducenepbf16 $123, %xmm23, %xmm22 {%k7}
+// CHECK: vreducebf16 $123, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %xmm23, %xmm22 {%k7}
+ vreducebf16 $123, %xmm23, %xmm22 {%k7}
-// CHECK: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b]
- vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
+ vreducebf16 $123, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+ vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+ vreducebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vreducenepbf16 $123, (%rip){1to8}, %xmm22
+// CHECK: vreducebf16 $123, (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 $123, (%rip){1to8}, %xmm22
+ vreducebf16 $123, (%rip){1to8}, %xmm22
-// CHECK: vreducenepbf16 $123, -512(,%rbp,2), %xmm22
+// CHECK: vreducebf16 $123, -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vreducenepbf16 $123, -512(,%rbp,2), %xmm22
+ vreducebf16 $123, -512(,%rbp,2), %xmm22
-// CHECK: vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+ vreducebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b]
- vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+ vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+ vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vreducenepbf16 $123, (%rip){1to16}, %ymm22
+// CHECK: vreducebf16 $123, (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 $123, (%rip){1to16}, %ymm22
+ vreducebf16 $123, (%rip){1to16}, %ymm22
-// CHECK: vreducenepbf16 $123, -1024(,%rbp,2), %ymm22
+// CHECK: vreducebf16 $123, -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vreducenepbf16 $123, -1024(,%rbp,2), %ymm22
+ vreducebf16 $123, -1024(,%rbp,2), %ymm22
-// CHECK: vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+ vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b]
- vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+ vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+ vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vreducenepbf16 $123, (%rip){1to32}, %zmm22
+// CHECK: vreducebf16 $123, (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 $123, (%rip){1to32}, %zmm22
+ vreducebf16 $123, (%rip){1to32}, %zmm22
-// CHECK: vreducenepbf16 $123, -2048(,%rbp,2), %zmm22
+// CHECK: vreducebf16 $123, -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vreducenepbf16 $123, -2048(,%rbp,2), %zmm22
+ vreducebf16 $123, -2048(,%rbp,2), %zmm22
-// CHECK: vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+ vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b]
- vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22
+// CHECK: vrndscalebf16 $123, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %zmm23, %zmm22
+ vrndscalebf16 $123, %zmm23, %zmm22
-// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7}
+// CHECK: vrndscalebf16 $123, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7}
+ vrndscalebf16 $123, %zmm23, %zmm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z}
+ vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22
+// CHECK: vrndscalebf16 $123, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %ymm23, %ymm22
+ vrndscalebf16 $123, %ymm23, %ymm22
-// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7}
+// CHECK: vrndscalebf16 $123, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7}
+ vrndscalebf16 $123, %ymm23, %ymm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z}
+ vrndscalebf16 $123, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22
+// CHECK: vrndscalebf16 $123, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %xmm23, %xmm22
+ vrndscalebf16 $123, %xmm23, %xmm22
-// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7}
+// CHECK: vrndscalebf16 $123, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7}
+ vrndscalebf16 $123, %xmm23, %xmm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b]
- vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z}
+ vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22
+ vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
+ vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%rip){1to8}, %xmm22
+// CHECK: vrndscalebf16 $123, (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, (%rip){1to8}, %xmm22
+ vrndscalebf16 $123, (%rip){1to8}, %xmm22
-// CHECK: vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22
+// CHECK: vrndscalebf16 $123, -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22
+ vrndscalebf16 $123, -512(,%rbp,2), %xmm22
-// CHECK: vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
+ vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22
+ vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
+ vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%rip){1to16}, %ymm22
+// CHECK: vrndscalebf16 $123, (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, (%rip){1to16}, %ymm22
+ vrndscalebf16 $123, (%rip){1to16}, %ymm22
-// CHECK: vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22
+// CHECK: vrndscalebf16 $123, -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22
+ vrndscalebf16 $123, -1024(,%rbp,2), %ymm22
-// CHECK: vrndscalenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
+ vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22
+ vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
+ vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vrndscalenepbf16 $123, (%rip){1to32}, %zmm22
+// CHECK: vrndscalebf16 $123, (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 $123, (%rip){1to32}, %zmm22
+ vrndscalebf16 $123, (%rip){1to32}, %zmm22
-// CHECK: vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22
+// CHECK: vrndscalebf16 $123, -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22
+ vrndscalebf16 $123, -2048(,%rbp,2), %zmm22
-// CHECK: vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
+ vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 %xmm23, %xmm22
+// CHECK: vrsqrtbf16 %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xf7]
- vrsqrtpbf16 %xmm23, %xmm22
+ vrsqrtbf16 %xmm23, %xmm22
-// CHECK: vrsqrtpbf16 %xmm23, %xmm22 {%k7}
+// CHECK: vrsqrtbf16 %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4e,0xf7]
- vrsqrtpbf16 %xmm23, %xmm22 {%k7}
+ vrsqrtbf16 %xmm23, %xmm22 {%k7}
-// CHECK: vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4e,0xf7]
- vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z}
+ vrsqrtbf16 %xmm23, %xmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 %zmm23, %zmm22
+// CHECK: vrsqrtbf16 %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xf7]
- vrsqrtpbf16 %zmm23, %zmm22
+ vrsqrtbf16 %zmm23, %zmm22
-// CHECK: vrsqrtpbf16 %zmm23, %zmm22 {%k7}
+// CHECK: vrsqrtbf16 %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4e,0xf7]
- vrsqrtpbf16 %zmm23, %zmm22 {%k7}
+ vrsqrtbf16 %zmm23, %zmm22 {%k7}
-// CHECK: vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4e,0xf7]
- vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z}
+ vrsqrtbf16 %zmm23, %zmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 %ymm23, %ymm22
+// CHECK: vrsqrtbf16 %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xf7]
- vrsqrtpbf16 %ymm23, %ymm22
+ vrsqrtbf16 %ymm23, %ymm22
-// CHECK: vrsqrtpbf16 %ymm23, %ymm22 {%k7}
+// CHECK: vrsqrtbf16 %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4e,0xf7]
- vrsqrtpbf16 %ymm23, %ymm22 {%k7}
+ vrsqrtbf16 %ymm23, %ymm22 {%k7}
-// CHECK: vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z}
+// CHECK: vrsqrtbf16 %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4e,0xf7]
- vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z}
+ vrsqrtbf16 %ymm23, %ymm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22
+ vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7}
+ vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vrsqrtpbf16 (%rip){1to8}, %xmm22
+// CHECK: vrsqrtbf16 (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 (%rip){1to8}, %xmm22
+ vrsqrtbf16 (%rip){1to8}, %xmm22
-// CHECK: vrsqrtpbf16 -512(,%rbp,2), %xmm22
+// CHECK: vrsqrtbf16 -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vrsqrtpbf16 -512(,%rbp,2), %xmm22
+ vrsqrtbf16 -512(,%rbp,2), %xmm22
-// CHECK: vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f]
- vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z}
+ vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80]
- vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22
+ vrsqrtbf16 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7}
+ vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vrsqrtpbf16 (%rip){1to16}, %ymm22
+// CHECK: vrsqrtbf16 (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 (%rip){1to16}, %ymm22
+ vrsqrtbf16 (%rip){1to16}, %ymm22
-// CHECK: vrsqrtpbf16 -1024(,%rbp,2), %ymm22
+// CHECK: vrsqrtbf16 -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vrsqrtpbf16 -1024(,%rbp,2), %ymm22
+ vrsqrtbf16 -1024(,%rbp,2), %ymm22
-// CHECK: vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f]
- vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z}
+ vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80]
- vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22
+ vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7}
+ vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vrsqrtpbf16 (%rip){1to32}, %zmm22
+// CHECK: vrsqrtbf16 (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 (%rip){1to32}, %zmm22
+ vrsqrtbf16 (%rip){1to32}, %zmm22
-// CHECK: vrsqrtpbf16 -2048(,%rbp,2), %zmm22
+// CHECK: vrsqrtbf16 -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vrsqrtpbf16 -2048(,%rbp,2), %zmm22
+ vrsqrtbf16 -2048(,%rbp,2), %zmm22
-// CHECK: vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f]
- vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z}
+ vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80]
- vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x2c,0xf0]
- vscalefpbf16 %ymm24, %ymm23, %ymm22
+ vscalefbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x2c,0xf0]
- vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x2c,0xf0]
- vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x2c,0xf0]
- vscalefpbf16 %zmm24, %zmm23, %zmm22
+ vscalefbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x2c,0xf0]
- vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x2c,0xf0]
- vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x2c,0xf0]
- vscalefpbf16 %xmm24, %xmm23, %xmm22
+ vscalefbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x2c,0xf0]
- vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x2c,0xf0]
- vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vscalefbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22
+ vscalefbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f]
- vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80]
- vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vscalefbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22
+ vscalefbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vscalefbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f]
- vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vscalefbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80]
- vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vscalefbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22
+ vscalefbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f]
- vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x2c,0x72,0x80]
- vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 %xmm23, %xmm22
+// CHECK: vsqrtbf16 %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xf7]
- vsqrtnepbf16 %xmm23, %xmm22
+ vsqrtbf16 %xmm23, %xmm22
-// CHECK: vsqrtnepbf16 %xmm23, %xmm22 {%k7}
+// CHECK: vsqrtbf16 %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x51,0xf7]
- vsqrtnepbf16 %xmm23, %xmm22 {%k7}
+ vsqrtbf16 %xmm23, %xmm22 {%k7}
-// CHECK: vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z}
+// CHECK: vsqrtbf16 %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x51,0xf7]
- vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z}
+ vsqrtbf16 %xmm23, %xmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 %zmm23, %zmm22
+// CHECK: vsqrtbf16 %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xf7]
- vsqrtnepbf16 %zmm23, %zmm22
+ vsqrtbf16 %zmm23, %zmm22
-// CHECK: vsqrtnepbf16 %zmm23, %zmm22 {%k7}
+// CHECK: vsqrtbf16 %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x51,0xf7]
- vsqrtnepbf16 %zmm23, %zmm22 {%k7}
+ vsqrtbf16 %zmm23, %zmm22 {%k7}
-// CHECK: vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z}
+// CHECK: vsqrtbf16 %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x51,0xf7]
- vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z}
+ vsqrtbf16 %zmm23, %zmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 %ymm23, %ymm22
+// CHECK: vsqrtbf16 %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xf7]
- vsqrtnepbf16 %ymm23, %ymm22
+ vsqrtbf16 %ymm23, %ymm22
-// CHECK: vsqrtnepbf16 %ymm23, %ymm22 {%k7}
+// CHECK: vsqrtbf16 %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x51,0xf7]
- vsqrtnepbf16 %ymm23, %ymm22 {%k7}
+ vsqrtbf16 %ymm23, %ymm22 {%k7}
-// CHECK: vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z}
+// CHECK: vsqrtbf16 %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x51,0xf7]
- vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z}
+ vsqrtbf16 %ymm23, %ymm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22
+// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %xmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22
+ vsqrtbf16 268435456(%rbp,%r14,8), %xmm22
-// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7}
+// CHECK: vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7}
+ vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7}
-// CHECK: vsqrtnepbf16 (%rip){1to8}, %xmm22
+// CHECK: vsqrtbf16 (%rip){1to8}, %xmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 (%rip){1to8}, %xmm22
+ vsqrtbf16 (%rip){1to8}, %xmm22
-// CHECK: vsqrtnepbf16 -512(,%rbp,2), %xmm22
+// CHECK: vsqrtbf16 -512(,%rbp,2), %xmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vsqrtnepbf16 -512(,%rbp,2), %xmm22
+ vsqrtbf16 -512(,%rbp,2), %xmm22
-// CHECK: vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z}
+// CHECK: vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f]
- vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z}
+ vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80]
- vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
+ vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22
+// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %ymm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22
+ vsqrtbf16 268435456(%rbp,%r14,8), %ymm22
-// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7}
+// CHECK: vsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7}
+ vsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7}
-// CHECK: vsqrtnepbf16 (%rip){1to16}, %ymm22
+// CHECK: vsqrtbf16 (%rip){1to16}, %ymm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 (%rip){1to16}, %ymm22
+ vsqrtbf16 (%rip){1to16}, %ymm22
-// CHECK: vsqrtnepbf16 -1024(,%rbp,2), %ymm22
+// CHECK: vsqrtbf16 -1024(,%rbp,2), %ymm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vsqrtnepbf16 -1024(,%rbp,2), %ymm22
+ vsqrtbf16 -1024(,%rbp,2), %ymm22
-// CHECK: vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z}
+// CHECK: vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f]
- vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z}
+ vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80]
- vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
+ vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22
+// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %zmm22
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22
+ vsqrtbf16 268435456(%rbp,%r14,8), %zmm22
-// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7}
+// CHECK: vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7}
+ vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7}
-// CHECK: vsqrtnepbf16 (%rip){1to32}, %zmm22
+// CHECK: vsqrtbf16 (%rip){1to32}, %zmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 (%rip){1to32}, %zmm22
+ vsqrtbf16 (%rip){1to32}, %zmm22
-// CHECK: vsqrtnepbf16 -2048(,%rbp,2), %zmm22
+// CHECK: vsqrtbf16 -2048(,%rbp,2), %zmm22
// CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vsqrtnepbf16 -2048(,%rbp,2), %zmm22
+ vsqrtbf16 -2048(,%rbp,2), %zmm22
-// CHECK: vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z}
+// CHECK: vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f]
- vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z}
+ vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z}
-// CHECK: vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+// CHECK: vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80]
- vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
+ vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z}
-// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22
+// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5c,0xf0]
- vsubnepbf16 %ymm24, %ymm23, %ymm22
+ vsubbf16 %ymm24, %ymm23, %ymm22
-// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5c,0xf0]
- vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7}
+ vsubbf16 %ymm24, %ymm23, %ymm22 {%k7}
-// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5c,0xf0]
- vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
+ vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22
+// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5c,0xf0]
- vsubnepbf16 %zmm24, %zmm23, %zmm22
+ vsubbf16 %zmm24, %zmm23, %zmm22
-// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5c,0xf0]
- vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7}
+ vsubbf16 %zmm24, %zmm23, %zmm22 {%k7}
-// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5c,0xf0]
- vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
+ vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22
+// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5c,0xf0]
- vsubnepbf16 %xmm24, %xmm23, %xmm22
+ vsubbf16 %xmm24, %xmm23, %xmm22
-// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5c,0xf0]
- vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7}
+ vsubbf16 %xmm24, %xmm23, %xmm22 {%k7}
-// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5c,0xf0]
- vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
+ vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+// CHECK: vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
+ vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22
-// CHECK: vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+// CHECK: vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
+ vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7}
-// CHECK: vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22
+// CHECK: vsubbf16 (%rip){1to32}, %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22
+ vsubbf16 (%rip){1to32}, %zmm23, %zmm22
-// CHECK: vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+// CHECK: vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22
+ vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22
-// CHECK: vsubnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+// CHECK: vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f]
- vsubnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
+ vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+// CHECK: vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80]
- vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
+ vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+// CHECK: vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
+ vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22
-// CHECK: vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+// CHECK: vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
+ vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7}
-// CHECK: vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22
+// CHECK: vsubbf16 (%rip){1to16}, %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22
+ vsubbf16 (%rip){1to16}, %ymm23, %ymm22
-// CHECK: vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+// CHECK: vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22
+ vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22
-// CHECK: vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+// CHECK: vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f]
- vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
+ vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+// CHECK: vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80]
- vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
+ vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z}
-// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+// CHECK: vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
+ vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22
-// CHECK: vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+// CHECK: vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
+ vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7}
-// CHECK: vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22
+// CHECK: vsubbf16 (%rip){1to8}, %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22
+ vsubbf16 (%rip){1to8}, %xmm23, %xmm22
-// CHECK: vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+// CHECK: vsubbf16 -512(,%rbp,2), %xmm23, %xmm22
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22
+ vsubbf16 -512(,%rbp,2), %xmm23, %xmm22
-// CHECK: vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+// CHECK: vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f]
- vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
+ vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z}
-// CHECK: vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+// CHECK: vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5c,0x72,0x80]
- vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
+ vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z}
diff --git a/llvm/test/MC/X86/avx10.2-bf16-64-intel.s b/llvm/test/MC/X86/avx10.2-bf16-64-intel.s
index 5f3dc45ba77458..a275979ad0a255 100644
--- a/llvm/test/MC/X86/avx10.2-bf16-64-intel.s
+++ b/llvm/test/MC/X86/avx10.2-bf16-64-intel.s
@@ -1,208 +1,208 @@
// RUN: llvm-mc -triple x86_64 -x86-asm-syntax=intel -output-asm-variant=1 --show-encoding %s | FileCheck %s
-// CHECK: vaddnepbf16 ymm22, ymm23, ymm24
+// CHECK: vaddbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x58,0xf0]
- vaddnepbf16 ymm22, ymm23, ymm24
+ vaddbf16 ymm22, ymm23, ymm24
-// CHECK: vaddnepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vaddbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x58,0xf0]
- vaddnepbf16 ymm22 {k7}, ymm23, ymm24
+ vaddbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x58,0xf0]
- vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vaddbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vaddnepbf16 zmm22, zmm23, zmm24
+// CHECK: vaddbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x58,0xf0]
- vaddnepbf16 zmm22, zmm23, zmm24
+ vaddbf16 zmm22, zmm23, zmm24
-// CHECK: vaddnepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vaddbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x58,0xf0]
- vaddnepbf16 zmm22 {k7}, zmm23, zmm24
+ vaddbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vaddbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x58,0xf0]
- vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vaddbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vaddnepbf16 xmm22, xmm23, xmm24
+// CHECK: vaddbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x58,0xf0]
- vaddnepbf16 xmm22, xmm23, xmm24
+ vaddbf16 xmm22, xmm23, xmm24
-// CHECK: vaddnepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vaddbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x58,0xf0]
- vaddnepbf16 xmm22 {k7}, xmm23, xmm24
+ vaddbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x58,0xf0]
- vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vaddbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vaddbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vaddbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vaddbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vaddbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f]
- vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vaddbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x58,0x72,0x80]
- vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vaddbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vaddbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vaddbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f]
- vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x58,0x72,0x80]
- vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00]
- vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vaddbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00]
- vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vaddbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x58,0x71,0x7f]
- vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x58,0x72,0x80]
- vaddnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vcmppbf16 k5, ymm23, ymm24, 123
+// CHECK: vcmpbf16 k5, ymm23, ymm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b]
- vcmppbf16 k5, ymm23, ymm24, 123
+ vcmpbf16 k5, ymm23, ymm24, 123
-// CHECK: vcmppbf16 k5 {k7}, ymm23, ymm24, 123
+// CHECK: vcmpbf16 k5 {k7}, ymm23, ymm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b]
- vcmppbf16 k5 {k7}, ymm23, ymm24, 123
+ vcmpbf16 k5 {k7}, ymm23, ymm24, 123
-// CHECK: vcmppbf16 k5, xmm23, xmm24, 123
+// CHECK: vcmpbf16 k5, xmm23, xmm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b]
- vcmppbf16 k5, xmm23, xmm24, 123
+ vcmpbf16 k5, xmm23, xmm24, 123
-// CHECK: vcmppbf16 k5 {k7}, xmm23, xmm24, 123
+// CHECK: vcmpbf16 k5 {k7}, xmm23, xmm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b]
- vcmppbf16 k5 {k7}, xmm23, xmm24, 123
+ vcmpbf16 k5 {k7}, xmm23, xmm24, 123
-// CHECK: vcmppbf16 k5, zmm23, zmm24, 123
+// CHECK: vcmpbf16 k5, zmm23, zmm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b]
- vcmppbf16 k5, zmm23, zmm24, 123
+ vcmpbf16 k5, zmm23, zmm24, 123
-// CHECK: vcmppbf16 k5 {k7}, zmm23, zmm24, 123
+// CHECK: vcmpbf16 k5 {k7}, zmm23, zmm24, 123
// CHECK: encoding: [0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b]
- vcmppbf16 k5 {k7}, zmm23, zmm24, 123
+ vcmpbf16 k5 {k7}, zmm23, zmm24, 123
-// CHECK: vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
+ vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
+ vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123
+// CHECK: vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123
+ vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123
-// CHECK: vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
+// CHECK: vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
+ vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
+// CHECK: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
+ vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123
-// CHECK: vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
+// CHECK: vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
+ vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123
-// CHECK: vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vcmpbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
+ vcmpbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
+ vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123
+// CHECK: vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123
+ vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123
-// CHECK: vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
+// CHECK: vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
+ vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
+// CHECK: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
+ vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123
-// CHECK: vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
+// CHECK: vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
+ vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123
-// CHECK: vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
+ vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
+ vcmpbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123
+// CHECK: vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123
+ vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123
-// CHECK: vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
+// CHECK: vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
+ vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
+// CHECK: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b]
- vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
+ vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123
-// CHECK: vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
+// CHECK: vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b]
- vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
+ vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123
// CHECK: vcomsbf16 xmm22, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x2f,0xf7]
@@ -232,2783 +232,2783 @@
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80]
vcomsbf16 xmm22, word ptr [rdx - 256]
-// CHECK: vdivnepbf16 ymm22, ymm23, ymm24
+// CHECK: vdivbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5e,0xf0]
- vdivnepbf16 ymm22, ymm23, ymm24
+ vdivbf16 ymm22, ymm23, ymm24
-// CHECK: vdivnepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vdivbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5e,0xf0]
- vdivnepbf16 ymm22 {k7}, ymm23, ymm24
+ vdivbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5e,0xf0]
- vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vdivbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vdivnepbf16 zmm22, zmm23, zmm24
+// CHECK: vdivbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5e,0xf0]
- vdivnepbf16 zmm22, zmm23, zmm24
+ vdivbf16 zmm22, zmm23, zmm24
-// CHECK: vdivnepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vdivbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5e,0xf0]
- vdivnepbf16 zmm22 {k7}, zmm23, zmm24
+ vdivbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5e,0xf0]
- vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vdivbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vdivnepbf16 xmm22, xmm23, xmm24
+// CHECK: vdivbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5e,0xf0]
- vdivnepbf16 xmm22, xmm23, xmm24
+ vdivbf16 xmm22, xmm23, xmm24
-// CHECK: vdivnepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vdivbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5e,0xf0]
- vdivnepbf16 xmm22 {k7}, xmm23, xmm24
+ vdivbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5e,0xf0]
- vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vdivbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vdivbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vdivbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f]
- vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80]
- vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vdivbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vdivbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f]
- vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80]
- vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vdivbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00]
- vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vdivbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vdivbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vdivbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f]
- vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5e,0x72,0x80]
- vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmadd132bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x98,0xf0]
- vfmadd132nepbf16 ymm22, ymm23, ymm24
+ vfmadd132bf16 ymm22, ymm23, ymm24
-// CHECK: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmadd132bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x98,0xf0]
- vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmadd132bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x98,0xf0]
- vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmadd132bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x98,0xf0]
- vfmadd132nepbf16 zmm22, zmm23, zmm24
+ vfmadd132bf16 zmm22, zmm23, zmm24
-// CHECK: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmadd132bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x98,0xf0]
- vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmadd132bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x98,0xf0]
- vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmadd132bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x98,0xf0]
- vfmadd132nepbf16 xmm22, xmm23, xmm24
+ vfmadd132bf16 xmm22, xmm23, xmm24
-// CHECK: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmadd132bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x98,0xf0]
- vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmadd132bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x98,0xf0]
- vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f]
- vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x98,0x72,0x80]
- vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f]
- vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x98,0x72,0x80]
- vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00]
- vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x98,0x71,0x7f]
- vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x98,0x72,0x80]
- vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmadd213bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xa8,0xf0]
- vfmadd213nepbf16 ymm22, ymm23, ymm24
+ vfmadd213bf16 ymm22, ymm23, ymm24
-// CHECK: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmadd213bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xa8,0xf0]
- vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmadd213bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xa8,0xf0]
- vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmadd213bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xa8,0xf0]
- vfmadd213nepbf16 zmm22, zmm23, zmm24
+ vfmadd213bf16 zmm22, zmm23, zmm24
-// CHECK: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmadd213bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xa8,0xf0]
- vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmadd213bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xa8,0xf0]
- vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmadd213bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xa8,0xf0]
- vfmadd213nepbf16 xmm22, xmm23, xmm24
+ vfmadd213bf16 xmm22, xmm23, xmm24
-// CHECK: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmadd213bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xa8,0xf0]
- vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmadd213bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xa8,0xf0]
- vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f]
- vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80]
- vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f]
- vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80]
- vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00]
- vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f]
- vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xa8,0x72,0x80]
- vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmadd231nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmadd231bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xb8,0xf0]
- vfmadd231nepbf16 ymm22, ymm23, ymm24
+ vfmadd231bf16 ymm22, ymm23, ymm24
-// CHECK: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmadd231bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xb8,0xf0]
- vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmadd231bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xb8,0xf0]
- vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmadd231bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xb8,0xf0]
- vfmadd231nepbf16 zmm22, zmm23, zmm24
+ vfmadd231bf16 zmm22, zmm23, zmm24
-// CHECK: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmadd231bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xb8,0xf0]
- vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmadd231bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xb8,0xf0]
- vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmadd231bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xb8,0xf0]
- vfmadd231nepbf16 xmm22, xmm23, xmm24
+ vfmadd231bf16 xmm22, xmm23, xmm24
-// CHECK: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmadd231bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xb8,0xf0]
- vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmadd231bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xb8,0xf0]
- vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f]
- vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80]
- vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f]
- vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80]
- vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00]
- vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f]
- vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xb8,0x72,0x80]
- vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmsub132bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9a,0xf0]
- vfmsub132nepbf16 ymm22, ymm23, ymm24
+ vfmsub132bf16 ymm22, ymm23, ymm24
-// CHECK: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmsub132bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9a,0xf0]
- vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmsub132bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9a,0xf0]
- vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmsub132bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9a,0xf0]
- vfmsub132nepbf16 zmm22, zmm23, zmm24
+ vfmsub132bf16 zmm22, zmm23, zmm24
-// CHECK: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmsub132bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9a,0xf0]
- vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmsub132bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9a,0xf0]
- vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmsub132bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9a,0xf0]
- vfmsub132nepbf16 xmm22, xmm23, xmm24
+ vfmsub132bf16 xmm22, xmm23, xmm24
-// CHECK: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmsub132bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9a,0xf0]
- vfmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmsub132bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9a,0xf0]
- vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f]
- vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80]
- vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f]
- vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80]
- vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00]
- vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f]
- vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9a,0x72,0x80]
- vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmsub213bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xaa,0xf0]
- vfmsub213nepbf16 ymm22, ymm23, ymm24
+ vfmsub213bf16 ymm22, ymm23, ymm24
-// CHECK: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmsub213bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xaa,0xf0]
- vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmsub213bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xaa,0xf0]
- vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmsub213bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xaa,0xf0]
- vfmsub213nepbf16 zmm22, zmm23, zmm24
+ vfmsub213bf16 zmm22, zmm23, zmm24
-// CHECK: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmsub213bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xaa,0xf0]
- vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmsub213bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xaa,0xf0]
- vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmsub213nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmsub213bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xaa,0xf0]
- vfmsub213nepbf16 xmm22, xmm23, xmm24
+ vfmsub213bf16 xmm22, xmm23, xmm24
-// CHECK: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmsub213bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xaa,0xf0]
- vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmsub213bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xaa,0xf0]
- vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f]
- vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80]
- vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f]
- vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80]
- vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00]
- vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f]
- vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xaa,0x72,0x80]
- vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfmsub231bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xba,0xf0]
- vfmsub231nepbf16 ymm22, ymm23, ymm24
+ vfmsub231bf16 ymm22, ymm23, ymm24
-// CHECK: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfmsub231bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xba,0xf0]
- vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfmsub231bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xba,0xf0]
- vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfmsub231bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xba,0xf0]
- vfmsub231nepbf16 zmm22, zmm23, zmm24
+ vfmsub231bf16 zmm22, zmm23, zmm24
-// CHECK: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfmsub231bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xba,0xf0]
- vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfmsub231bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xba,0xf0]
- vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfmsub231bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xba,0xf0]
- vfmsub231nepbf16 xmm22, xmm23, xmm24
+ vfmsub231bf16 xmm22, xmm23, xmm24
-// CHECK: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfmsub231bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xba,0xf0]
- vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfmsub231bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xba,0xf0]
- vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f]
- vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xba,0x72,0x80]
- vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f]
- vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xba,0x72,0x80]
- vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00]
- vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xba,0x71,0x7f]
- vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xba,0x72,0x80]
- vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmadd132bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9c,0xf0]
- vfnmadd132nepbf16 ymm22, ymm23, ymm24
+ vfnmadd132bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9c,0xf0]
- vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9c,0xf0]
- vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmadd132bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9c,0xf0]
- vfnmadd132nepbf16 zmm22, zmm23, zmm24
+ vfnmadd132bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9c,0xf0]
- vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9c,0xf0]
- vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmadd132bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9c,0xf0]
- vfnmadd132nepbf16 xmm22, xmm23, xmm24
+ vfnmadd132bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9c,0xf0]
- vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9c,0xf0]
- vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80]
- vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80]
- vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00]
- vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f]
- vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9c,0x72,0x80]
- vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmadd213bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xac,0xf0]
- vfnmadd213nepbf16 ymm22, ymm23, ymm24
+ vfnmadd213bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xac,0xf0]
- vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xac,0xf0]
- vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmadd213bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xac,0xf0]
- vfnmadd213nepbf16 zmm22, zmm23, zmm24
+ vfnmadd213bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmadd213bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xac,0xf0]
- vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmadd213bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xac,0xf0]
- vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmadd213bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xac,0xf0]
- vfnmadd213nepbf16 xmm22, xmm23, xmm24
+ vfnmadd213bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xac,0xf0]
- vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xac,0xf0]
- vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f]
- vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xac,0x72,0x80]
- vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f]
- vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xac,0x72,0x80]
- vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00]
- vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xac,0x71,0x7f]
- vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xac,0x72,0x80]
- vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmadd231bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xbc,0xf0]
- vfnmadd231nepbf16 ymm22, ymm23, ymm24
+ vfnmadd231bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xbc,0xf0]
- vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbc,0xf0]
- vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmadd231bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xbc,0xf0]
- vfnmadd231nepbf16 zmm22, zmm23, zmm24
+ vfnmadd231bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xbc,0xf0]
- vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbc,0xf0]
- vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmadd231bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xbc,0xf0]
- vfnmadd231nepbf16 xmm22, xmm23, xmm24
+ vfnmadd231bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xbc,0xf0]
- vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xbc,0xf0]
- vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80]
- vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80]
- vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00]
- vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f]
- vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbc,0x72,0x80]
- vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmsub132bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x9e,0xf0]
- vfnmsub132nepbf16 ymm22, ymm23, ymm24
+ vfnmsub132bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x9e,0xf0]
- vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9e,0xf0]
- vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmsub132bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x9e,0xf0]
- vfnmsub132nepbf16 zmm22, zmm23, zmm24
+ vfnmsub132bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x9e,0xf0]
- vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9e,0xf0]
- vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmsub132bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x9e,0xf0]
- vfnmsub132nepbf16 xmm22, xmm23, xmm24
+ vfnmsub132bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x9e,0xf0]
- vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x9e,0xf0]
- vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80]
- vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80]
- vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00]
- vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f]
- vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9e,0x72,0x80]
- vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmsub213bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xae,0xf0]
- vfnmsub213nepbf16 ymm22, ymm23, ymm24
+ vfnmsub213bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xae,0xf0]
- vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xae,0xf0]
- vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmsub213bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xae,0xf0]
- vfnmsub213nepbf16 zmm22, zmm23, zmm24
+ vfnmsub213bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xae,0xf0]
- vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xae,0xf0]
- vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmsub213bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xae,0xf0]
- vfnmsub213nepbf16 xmm22, xmm23, xmm24
+ vfnmsub213bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xae,0xf0]
- vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xae,0xf0]
- vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f]
- vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xae,0x72,0x80]
- vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f]
- vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xae,0x72,0x80]
- vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00]
- vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xae,0x71,0x7f]
- vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xae,0x72,0x80]
- vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymm24
+// CHECK: vfnmsub231bf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0xbe,0xf0]
- vfnmsub231nepbf16 ymm22, ymm23, ymm24
+ vfnmsub231bf16 ymm22, ymm23, ymm24
-// CHECK: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0xbe,0xf0]
- vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24
+ vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbe,0xf0]
- vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmm24
+// CHECK: vfnmsub231bf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0xbe,0xf0]
- vfnmsub231nepbf16 zmm22, zmm23, zmm24
+ vfnmsub231bf16 zmm22, zmm23, zmm24
-// CHECK: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0xbe,0xf0]
- vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24
+ vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbe,0xf0]
- vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmm24
+// CHECK: vfnmsub231bf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0xbe,0xf0]
- vfnmsub231nepbf16 xmm22, xmm23, xmm24
+ vfnmsub231bf16 xmm22, xmm23, xmm24
-// CHECK: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0xbe,0xf0]
- vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24
+ vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0xbe,0xf0]
- vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80]
- vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80]
- vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00]
- vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00]
- vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f]
- vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbe,0x72,0x80]
- vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vfpclasspbf16 k5, zmm23, 123
+// CHECK: vfpclassbf16 k5, zmm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b]
- vfpclasspbf16 k5, zmm23, 123
+ vfpclassbf16 k5, zmm23, 123
-// CHECK: vfpclasspbf16 k5 {k7}, zmm23, 123
+// CHECK: vfpclassbf16 k5 {k7}, zmm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b]
- vfpclasspbf16 k5 {k7}, zmm23, 123
+ vfpclassbf16 k5 {k7}, zmm23, 123
-// CHECK: vfpclasspbf16 k5, ymm23, 123
+// CHECK: vfpclassbf16 k5, ymm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b]
- vfpclasspbf16 k5, ymm23, 123
+ vfpclassbf16 k5, ymm23, 123
-// CHECK: vfpclasspbf16 k5 {k7}, ymm23, 123
+// CHECK: vfpclassbf16 k5 {k7}, ymm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b]
- vfpclasspbf16 k5 {k7}, ymm23, 123
+ vfpclassbf16 k5 {k7}, ymm23, 123
-// CHECK: vfpclasspbf16 k5, xmm23, 123
+// CHECK: vfpclassbf16 k5, xmm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b]
- vfpclasspbf16 k5, xmm23, 123
+ vfpclassbf16 k5, xmm23, 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmm23, 123
+// CHECK: vfpclassbf16 k5 {k7}, xmm23, 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b]
- vfpclasspbf16 k5 {k7}, xmm23, 123
+ vfpclassbf16 k5 {k7}, xmm23, 123
-// CHECK: vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
+ vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b]
- vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+ vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to8}, 123
+// CHECK: vfpclassbf16 k5, word ptr [rip]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 k5, word ptr [rip]{1to8}, 123
+ vfpclassbf16 k5, word ptr [rip]{1to8}, 123
-// CHECK: vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123
+// CHECK: vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123
+ vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123
-// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
+// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
+ vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
+ vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123
-// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to16}, 123
+// CHECK: vfpclassbf16 k5, word ptr [rip]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 k5, word ptr [rip]{1to16}, 123
+ vfpclassbf16 k5, word ptr [rip]{1to16}, 123
-// CHECK: vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123
+// CHECK: vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123
+ vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123
-// CHECK: vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
+// CHECK: vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
+ vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
+ vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123
-// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to32}, 123
+// CHECK: vfpclassbf16 k5, word ptr [rip]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b]
- vfpclasspbf16 k5, word ptr [rip]{1to32}, 123
+ vfpclassbf16 k5, word ptr [rip]{1to32}, 123
-// CHECK: vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123
+// CHECK: vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123
+ vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123
-// CHECK: vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
+// CHECK: vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b]
- vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
+ vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123
-// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
+// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b]
- vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
+ vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123
-// CHECK: vgetexppbf16 xmm22, xmm23
+// CHECK: vgetexpbf16 xmm22, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xf7]
- vgetexppbf16 xmm22, xmm23
+ vgetexpbf16 xmm22, xmm23
-// CHECK: vgetexppbf16 xmm22 {k7}, xmm23
+// CHECK: vgetexpbf16 xmm22 {k7}, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x42,0xf7]
- vgetexppbf16 xmm22 {k7}, xmm23
+ vgetexpbf16 xmm22 {k7}, xmm23
-// CHECK: vgetexppbf16 xmm22 {k7} {z}, xmm23
+// CHECK: vgetexpbf16 xmm22 {k7} {z}, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x42,0xf7]
- vgetexppbf16 xmm22 {k7} {z}, xmm23
+ vgetexpbf16 xmm22 {k7} {z}, xmm23
-// CHECK: vgetexppbf16 zmm22, zmm23
+// CHECK: vgetexpbf16 zmm22, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xf7]
- vgetexppbf16 zmm22, zmm23
+ vgetexpbf16 zmm22, zmm23
-// CHECK: vgetexppbf16 zmm22 {k7}, zmm23
+// CHECK: vgetexpbf16 zmm22 {k7}, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x42,0xf7]
- vgetexppbf16 zmm22 {k7}, zmm23
+ vgetexpbf16 zmm22 {k7}, zmm23
-// CHECK: vgetexppbf16 zmm22 {k7} {z}, zmm23
+// CHECK: vgetexpbf16 zmm22 {k7} {z}, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x42,0xf7]
- vgetexppbf16 zmm22 {k7} {z}, zmm23
+ vgetexpbf16 zmm22 {k7} {z}, zmm23
-// CHECK: vgetexppbf16 ymm22, ymm23
+// CHECK: vgetexpbf16 ymm22, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xf7]
- vgetexppbf16 ymm22, ymm23
+ vgetexpbf16 ymm22, ymm23
-// CHECK: vgetexppbf16 ymm22 {k7}, ymm23
+// CHECK: vgetexpbf16 ymm22 {k7}, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x42,0xf7]
- vgetexppbf16 ymm22 {k7}, ymm23
+ vgetexpbf16 ymm22 {k7}, ymm23
-// CHECK: vgetexppbf16 ymm22 {k7} {z}, ymm23
+// CHECK: vgetexpbf16 ymm22 {k7} {z}, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x42,0xf7]
- vgetexppbf16 ymm22 {k7} {z}, ymm23
+ vgetexpbf16 ymm22 {k7} {z}, ymm23
-// CHECK: vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+ vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+ vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vgetexppbf16 xmm22, word ptr [rip]{1to8}
+// CHECK: vgetexpbf16 xmm22, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 xmm22, word ptr [rip]{1to8}
+ vgetexpbf16 xmm22, word ptr [rip]{1to8}
-// CHECK: vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512]
+// CHECK: vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512]
+ vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512]
-// CHECK: vgetexppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+// CHECK: vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f]
- vgetexppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+ vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
-// CHECK: vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+// CHECK: vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80]
- vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+ vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
-// CHECK: vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+ vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+ vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vgetexppbf16 ymm22, word ptr [rip]{1to16}
+// CHECK: vgetexpbf16 ymm22, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 ymm22, word ptr [rip]{1to16}
+ vgetexpbf16 ymm22, word ptr [rip]{1to16}
-// CHECK: vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+// CHECK: vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+ vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024]
-// CHECK: vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+// CHECK: vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f]
- vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+ vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
-// CHECK: vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+// CHECK: vgetexpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80]
- vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+ vgetexpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
-// CHECK: vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+ vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00]
- vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+ vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vgetexppbf16 zmm22, word ptr [rip]{1to32}
+// CHECK: vgetexpbf16 zmm22, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00]
- vgetexppbf16 zmm22, word ptr [rip]{1to32}
+ vgetexpbf16 zmm22, word ptr [rip]{1to32}
-// CHECK: vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+// CHECK: vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+ vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048]
-// CHECK: vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+// CHECK: vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f]
- vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+ vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
-// CHECK: vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+// CHECK: vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80]
- vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+ vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
-// CHECK: vgetmantpbf16 zmm22, zmm23, 123
+// CHECK: vgetmantbf16 zmm22, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b]
- vgetmantpbf16 zmm22, zmm23, 123
+ vgetmantbf16 zmm22, zmm23, 123
-// CHECK: vgetmantpbf16 zmm22 {k7}, zmm23, 123
+// CHECK: vgetmantbf16 zmm22 {k7}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b]
- vgetmantpbf16 zmm22 {k7}, zmm23, 123
+ vgetmantbf16 zmm22 {k7}, zmm23, 123
-// CHECK: vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123
+// CHECK: vgetmantbf16 zmm22 {k7} {z}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b]
- vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123
+ vgetmantbf16 zmm22 {k7} {z}, zmm23, 123
-// CHECK: vgetmantpbf16 ymm22, ymm23, 123
+// CHECK: vgetmantbf16 ymm22, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b]
- vgetmantpbf16 ymm22, ymm23, 123
+ vgetmantbf16 ymm22, ymm23, 123
-// CHECK: vgetmantpbf16 ymm22 {k7}, ymm23, 123
+// CHECK: vgetmantbf16 ymm22 {k7}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b]
- vgetmantpbf16 ymm22 {k7}, ymm23, 123
+ vgetmantbf16 ymm22 {k7}, ymm23, 123
-// CHECK: vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123
+// CHECK: vgetmantbf16 ymm22 {k7} {z}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b]
- vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123
+ vgetmantbf16 ymm22 {k7} {z}, ymm23, 123
-// CHECK: vgetmantpbf16 xmm22, xmm23, 123
+// CHECK: vgetmantbf16 xmm22, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b]
- vgetmantpbf16 xmm22, xmm23, 123
+ vgetmantbf16 xmm22, xmm23, 123
-// CHECK: vgetmantpbf16 xmm22 {k7}, xmm23, 123
+// CHECK: vgetmantbf16 xmm22 {k7}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b]
- vgetmantpbf16 xmm22 {k7}, xmm23, 123
+ vgetmantbf16 xmm22 {k7}, xmm23, 123
-// CHECK: vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123
+// CHECK: vgetmantbf16 xmm22 {k7} {z}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b]
- vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123
+ vgetmantbf16 xmm22 {k7} {z}, xmm23, 123
-// CHECK: vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+ vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+ vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123
+// CHECK: vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123
+ vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123
-// CHECK: vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+// CHECK: vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+ vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123
-// CHECK: vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+// CHECK: vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+ vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
-// CHECK: vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+// CHECK: vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+ vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
-// CHECK: vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+ vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+ vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123
+// CHECK: vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123
+ vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123
-// CHECK: vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+// CHECK: vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+ vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
-// CHECK: vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+// CHECK: vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+ vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
-// CHECK: vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+// CHECK: vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+ vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
-// CHECK: vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+ vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+ vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123
+// CHECK: vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b]
- vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123
+ vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123
-// CHECK: vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+// CHECK: vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+ vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
-// CHECK: vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+// CHECK: vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b]
- vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+ vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
-// CHECK: vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+// CHECK: vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b]
- vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+ vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
-// CHECK: vmaxpbf16 ymm22, ymm23, ymm24
+// CHECK: vmaxbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5f,0xf0]
- vmaxpbf16 ymm22, ymm23, ymm24
+ vmaxbf16 ymm22, ymm23, ymm24
-// CHECK: vmaxpbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vmaxbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5f,0xf0]
- vmaxpbf16 ymm22 {k7}, ymm23, ymm24
+ vmaxbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5f,0xf0]
- vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vmaxpbf16 zmm22, zmm23, zmm24
+// CHECK: vmaxbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5f,0xf0]
- vmaxpbf16 zmm22, zmm23, zmm24
+ vmaxbf16 zmm22, zmm23, zmm24
-// CHECK: vmaxpbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vmaxbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5f,0xf0]
- vmaxpbf16 zmm22 {k7}, zmm23, zmm24
+ vmaxbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5f,0xf0]
- vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vmaxpbf16 xmm22, xmm23, xmm24
+// CHECK: vmaxbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5f,0xf0]
- vmaxpbf16 xmm22, xmm23, xmm24
+ vmaxbf16 xmm22, xmm23, xmm24
-// CHECK: vmaxpbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vmaxbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5f,0xf0]
- vmaxpbf16 xmm22 {k7}, xmm23, xmm24
+ vmaxbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5f,0xf0]
- vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f]
- vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80]
- vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f]
- vmaxpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80]
- vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00]
- vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f]
- vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5f,0x72,0x80]
- vmaxpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vminpbf16 ymm22, ymm23, ymm24
+// CHECK: vminbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5d,0xf0]
- vminpbf16 ymm22, ymm23, ymm24
+ vminbf16 ymm22, ymm23, ymm24
-// CHECK: vminpbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vminbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5d,0xf0]
- vminpbf16 ymm22 {k7}, ymm23, ymm24
+ vminbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5d,0xf0]
- vminpbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vminbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vminpbf16 zmm22, zmm23, zmm24
+// CHECK: vminbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5d,0xf0]
- vminpbf16 zmm22, zmm23, zmm24
+ vminbf16 zmm22, zmm23, zmm24
-// CHECK: vminpbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vminbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5d,0xf0]
- vminpbf16 zmm22 {k7}, zmm23, zmm24
+ vminbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5d,0xf0]
- vminpbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vminbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vminpbf16 xmm22, xmm23, xmm24
+// CHECK: vminbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5d,0xf0]
- vminpbf16 xmm22, xmm23, xmm24
+ vminbf16 xmm22, xmm23, xmm24
-// CHECK: vminpbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vminbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5d,0xf0]
- vminpbf16 xmm22 {k7}, xmm23, xmm24
+ vminbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5d,0xf0]
- vminpbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vminbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vminpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vminbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vminbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f]
- vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vminbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80]
- vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vminpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vminbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vminbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f]
- vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80]
- vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00]
- vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vminpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vminbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00]
- vminpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vminbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f]
- vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5d,0x72,0x80]
- vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vmulnepbf16 ymm22, ymm23, ymm24
+// CHECK: vmulbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x59,0xf0]
- vmulnepbf16 ymm22, ymm23, ymm24
+ vmulbf16 ymm22, ymm23, ymm24
-// CHECK: vmulnepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vmulbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x59,0xf0]
- vmulnepbf16 ymm22 {k7}, ymm23, ymm24
+ vmulbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x59,0xf0]
- vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vmulbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vmulnepbf16 zmm22, zmm23, zmm24
+// CHECK: vmulbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x59,0xf0]
- vmulnepbf16 zmm22, zmm23, zmm24
+ vmulbf16 zmm22, zmm23, zmm24
-// CHECK: vmulnepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vmulbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x59,0xf0]
- vmulnepbf16 zmm22 {k7}, zmm23, zmm24
+ vmulbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x59,0xf0]
- vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vmulbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vmulnepbf16 xmm22, xmm23, xmm24
+// CHECK: vmulbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x59,0xf0]
- vmulnepbf16 xmm22, xmm23, xmm24
+ vmulbf16 xmm22, xmm23, xmm24
-// CHECK: vmulnepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vmulbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x59,0xf0]
- vmulnepbf16 xmm22 {k7}, xmm23, xmm24
+ vmulbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x59,0xf0]
- vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vmulbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vmulbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vmulbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f]
- vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x59,0x72,0x80]
- vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vmulbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vmulbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vmulbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vmulbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f]
- vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x59,0x72,0x80]
- vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vmulbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00]
- vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vmulbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00]
- vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vmulbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x59,0x71,0x7f]
- vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x59,0x72,0x80]
- vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vrcppbf16 xmm22, xmm23
+// CHECK: vrcpbf16 xmm22, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xf7]
- vrcppbf16 xmm22, xmm23
+ vrcpbf16 xmm22, xmm23
-// CHECK: vrcppbf16 xmm22 {k7}, xmm23
+// CHECK: vrcpbf16 xmm22 {k7}, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4c,0xf7]
- vrcppbf16 xmm22 {k7}, xmm23
+ vrcpbf16 xmm22 {k7}, xmm23
-// CHECK: vrcppbf16 xmm22 {k7} {z}, xmm23
+// CHECK: vrcpbf16 xmm22 {k7} {z}, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4c,0xf7]
- vrcppbf16 xmm22 {k7} {z}, xmm23
+ vrcpbf16 xmm22 {k7} {z}, xmm23
-// CHECK: vrcppbf16 zmm22, zmm23
+// CHECK: vrcpbf16 zmm22, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xf7]
- vrcppbf16 zmm22, zmm23
+ vrcpbf16 zmm22, zmm23
-// CHECK: vrcppbf16 zmm22 {k7}, zmm23
+// CHECK: vrcpbf16 zmm22 {k7}, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4c,0xf7]
- vrcppbf16 zmm22 {k7}, zmm23
+ vrcpbf16 zmm22 {k7}, zmm23
-// CHECK: vrcppbf16 zmm22 {k7} {z}, zmm23
+// CHECK: vrcpbf16 zmm22 {k7} {z}, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4c,0xf7]
- vrcppbf16 zmm22 {k7} {z}, zmm23
+ vrcpbf16 zmm22 {k7} {z}, zmm23
-// CHECK: vrcppbf16 ymm22, ymm23
+// CHECK: vrcpbf16 ymm22, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xf7]
- vrcppbf16 ymm22, ymm23
+ vrcpbf16 ymm22, ymm23
-// CHECK: vrcppbf16 ymm22 {k7}, ymm23
+// CHECK: vrcpbf16 ymm22 {k7}, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4c,0xf7]
- vrcppbf16 ymm22 {k7}, ymm23
+ vrcpbf16 ymm22 {k7}, ymm23
-// CHECK: vrcppbf16 ymm22 {k7} {z}, ymm23
+// CHECK: vrcpbf16 ymm22 {k7} {z}, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4c,0xf7]
- vrcppbf16 ymm22 {k7} {z}, ymm23
+ vrcpbf16 ymm22 {k7} {z}, ymm23
-// CHECK: vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+ vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+ vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vrcppbf16 xmm22, word ptr [rip]{1to8}
+// CHECK: vrcpbf16 xmm22, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 xmm22, word ptr [rip]{1to8}
+ vrcpbf16 xmm22, word ptr [rip]{1to8}
-// CHECK: vrcppbf16 xmm22, xmmword ptr [2*rbp - 512]
+// CHECK: vrcpbf16 xmm22, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vrcppbf16 xmm22, xmmword ptr [2*rbp - 512]
+ vrcpbf16 xmm22, xmmword ptr [2*rbp - 512]
-// CHECK: vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+// CHECK: vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f]
- vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+ vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
-// CHECK: vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+// CHECK: vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80]
- vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+ vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
-// CHECK: vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+ vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+ vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vrcppbf16 ymm22, word ptr [rip]{1to16}
+// CHECK: vrcpbf16 ymm22, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 ymm22, word ptr [rip]{1to16}
+ vrcpbf16 ymm22, word ptr [rip]{1to16}
-// CHECK: vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+// CHECK: vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024]
+ vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024]
-// CHECK: vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+// CHECK: vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f]
- vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+ vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
-// CHECK: vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+// CHECK: vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80]
- vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+ vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
-// CHECK: vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+ vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+ vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vrcppbf16 zmm22, word ptr [rip]{1to32}
+// CHECK: vrcpbf16 zmm22, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00]
- vrcppbf16 zmm22, word ptr [rip]{1to32}
+ vrcpbf16 zmm22, word ptr [rip]{1to32}
-// CHECK: vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+// CHECK: vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048]
+ vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048]
-// CHECK: vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+// CHECK: vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f]
- vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+ vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
-// CHECK: vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+// CHECK: vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80]
- vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+ vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
-// CHECK: vreducenepbf16 zmm22, zmm23, 123
+// CHECK: vreducebf16 zmm22, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b]
- vreducenepbf16 zmm22, zmm23, 123
+ vreducebf16 zmm22, zmm23, 123
-// CHECK: vreducenepbf16 zmm22 {k7}, zmm23, 123
+// CHECK: vreducebf16 zmm22 {k7}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b]
- vreducenepbf16 zmm22 {k7}, zmm23, 123
+ vreducebf16 zmm22 {k7}, zmm23, 123
-// CHECK: vreducenepbf16 zmm22 {k7} {z}, zmm23, 123
+// CHECK: vreducebf16 zmm22 {k7} {z}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b]
- vreducenepbf16 zmm22 {k7} {z}, zmm23, 123
+ vreducebf16 zmm22 {k7} {z}, zmm23, 123
-// CHECK: vreducenepbf16 ymm22, ymm23, 123
+// CHECK: vreducebf16 ymm22, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b]
- vreducenepbf16 ymm22, ymm23, 123
+ vreducebf16 ymm22, ymm23, 123
-// CHECK: vreducenepbf16 ymm22 {k7}, ymm23, 123
+// CHECK: vreducebf16 ymm22 {k7}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b]
- vreducenepbf16 ymm22 {k7}, ymm23, 123
+ vreducebf16 ymm22 {k7}, ymm23, 123
-// CHECK: vreducenepbf16 ymm22 {k7} {z}, ymm23, 123
+// CHECK: vreducebf16 ymm22 {k7} {z}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b]
- vreducenepbf16 ymm22 {k7} {z}, ymm23, 123
+ vreducebf16 ymm22 {k7} {z}, ymm23, 123
-// CHECK: vreducenepbf16 xmm22, xmm23, 123
+// CHECK: vreducebf16 xmm22, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b]
- vreducenepbf16 xmm22, xmm23, 123
+ vreducebf16 xmm22, xmm23, 123
-// CHECK: vreducenepbf16 xmm22 {k7}, xmm23, 123
+// CHECK: vreducebf16 xmm22 {k7}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b]
- vreducenepbf16 xmm22 {k7}, xmm23, 123
+ vreducebf16 xmm22 {k7}, xmm23, 123
-// CHECK: vreducenepbf16 xmm22 {k7} {z}, xmm23, 123
+// CHECK: vreducebf16 xmm22 {k7} {z}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b]
- vreducenepbf16 xmm22 {k7} {z}, xmm23, 123
+ vreducebf16 xmm22 {k7} {z}, xmm23, 123
-// CHECK: vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+ vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+ vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123
+// CHECK: vreducebf16 xmm22, word ptr [rip]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123
+ vreducebf16 xmm22, word ptr [rip]{1to8}, 123
-// CHECK: vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+// CHECK: vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+ vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123
-// CHECK: vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+// CHECK: vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+ vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
-// CHECK: vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+// CHECK: vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b]
- vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+ vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
-// CHECK: vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+ vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+ vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123
+// CHECK: vreducebf16 ymm22, word ptr [rip]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123
+ vreducebf16 ymm22, word ptr [rip]{1to16}, 123
-// CHECK: vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+// CHECK: vreducebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+ vreducebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
-// CHECK: vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+// CHECK: vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+ vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
-// CHECK: vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+// CHECK: vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b]
- vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+ vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
-// CHECK: vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+ vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+ vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123
+// CHECK: vreducebf16 zmm22, word ptr [rip]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b]
- vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123
+ vreducebf16 zmm22, word ptr [rip]{1to32}, 123
-// CHECK: vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+// CHECK: vreducebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+ vreducebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
-// CHECK: vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+// CHECK: vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b]
- vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+ vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
-// CHECK: vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+// CHECK: vreducebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b]
- vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+ vreducebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
-// CHECK: vrndscalenepbf16 zmm22, zmm23, 123
+// CHECK: vrndscalebf16 zmm22, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b]
- vrndscalenepbf16 zmm22, zmm23, 123
+ vrndscalebf16 zmm22, zmm23, 123
-// CHECK: vrndscalenepbf16 zmm22 {k7}, zmm23, 123
+// CHECK: vrndscalebf16 zmm22 {k7}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b]
- vrndscalenepbf16 zmm22 {k7}, zmm23, 123
+ vrndscalebf16 zmm22 {k7}, zmm23, 123
-// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123
+// CHECK: vrndscalebf16 zmm22 {k7} {z}, zmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b]
- vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123
+ vrndscalebf16 zmm22 {k7} {z}, zmm23, 123
-// CHECK: vrndscalenepbf16 ymm22, ymm23, 123
+// CHECK: vrndscalebf16 ymm22, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b]
- vrndscalenepbf16 ymm22, ymm23, 123
+ vrndscalebf16 ymm22, ymm23, 123
-// CHECK: vrndscalenepbf16 ymm22 {k7}, ymm23, 123
+// CHECK: vrndscalebf16 ymm22 {k7}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b]
- vrndscalenepbf16 ymm22 {k7}, ymm23, 123
+ vrndscalebf16 ymm22 {k7}, ymm23, 123
-// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123
+// CHECK: vrndscalebf16 ymm22 {k7} {z}, ymm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b]
- vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123
+ vrndscalebf16 ymm22 {k7} {z}, ymm23, 123
-// CHECK: vrndscalenepbf16 xmm22, xmm23, 123
+// CHECK: vrndscalebf16 xmm22, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b]
- vrndscalenepbf16 xmm22, xmm23, 123
+ vrndscalebf16 xmm22, xmm23, 123
-// CHECK: vrndscalenepbf16 xmm22 {k7}, xmm23, 123
+// CHECK: vrndscalebf16 xmm22 {k7}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b]
- vrndscalenepbf16 xmm22 {k7}, xmm23, 123
+ vrndscalebf16 xmm22 {k7}, xmm23, 123
-// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123
+// CHECK: vrndscalebf16 xmm22 {k7} {z}, xmm23, 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b]
- vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123
+ vrndscalebf16 xmm22 {k7} {z}, xmm23, 123
-// CHECK: vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
+ vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
+ vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123
+// CHECK: vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123
+ vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123
-// CHECK: vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+// CHECK: vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b]
- vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123
+ vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123
-// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+// CHECK: vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
+ vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123
-// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+// CHECK: vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
+ vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123
-// CHECK: vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
+ vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
+ vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vrndscalenepbf16 ymm22, word ptr [rip]{1to16}, 123
+// CHECK: vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 ymm22, word ptr [rip]{1to16}, 123
+ vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123
-// CHECK: vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+// CHECK: vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b]
- vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123
+ vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123
-// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+// CHECK: vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
+ vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123
-// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+// CHECK: vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
+ vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123
-// CHECK: vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+// CHECK: vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
// CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b]
- vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
+ vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123
-// CHECK: vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+// CHECK: vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
// CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b]
- vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
+ vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123
-// CHECK: vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123
+// CHECK: vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b]
- vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123
+ vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123
-// CHECK: vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+// CHECK: vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b]
- vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123
+ vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123
-// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+// CHECK: vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b]
- vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
+ vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123
-// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+// CHECK: vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
// CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b]
- vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
+ vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123
-// CHECK: vrsqrtpbf16 xmm22, xmm23
+// CHECK: vrsqrtbf16 xmm22, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xf7]
- vrsqrtpbf16 xmm22, xmm23
+ vrsqrtbf16 xmm22, xmm23
-// CHECK: vrsqrtpbf16 xmm22 {k7}, xmm23
+// CHECK: vrsqrtbf16 xmm22 {k7}, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4e,0xf7]
- vrsqrtpbf16 xmm22 {k7}, xmm23
+ vrsqrtbf16 xmm22 {k7}, xmm23
-// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, xmm23
+// CHECK: vrsqrtbf16 xmm22 {k7} {z}, xmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4e,0xf7]
- vrsqrtpbf16 xmm22 {k7} {z}, xmm23
+ vrsqrtbf16 xmm22 {k7} {z}, xmm23
-// CHECK: vrsqrtpbf16 zmm22, zmm23
+// CHECK: vrsqrtbf16 zmm22, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xf7]
- vrsqrtpbf16 zmm22, zmm23
+ vrsqrtbf16 zmm22, zmm23
-// CHECK: vrsqrtpbf16 zmm22 {k7}, zmm23
+// CHECK: vrsqrtbf16 zmm22 {k7}, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4e,0xf7]
- vrsqrtpbf16 zmm22 {k7}, zmm23
+ vrsqrtbf16 zmm22 {k7}, zmm23
-// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, zmm23
+// CHECK: vrsqrtbf16 zmm22 {k7} {z}, zmm23
// CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4e,0xf7]
- vrsqrtpbf16 zmm22 {k7} {z}, zmm23
+ vrsqrtbf16 zmm22 {k7} {z}, zmm23
-// CHECK: vrsqrtpbf16 ymm22, ymm23
+// CHECK: vrsqrtbf16 ymm22, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xf7]
- vrsqrtpbf16 ymm22, ymm23
+ vrsqrtbf16 ymm22, ymm23
-// CHECK: vrsqrtpbf16 ymm22 {k7}, ymm23
+// CHECK: vrsqrtbf16 ymm22 {k7}, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4e,0xf7]
- vrsqrtpbf16 ymm22 {k7}, ymm23
+ vrsqrtbf16 ymm22 {k7}, ymm23
-// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, ymm23
+// CHECK: vrsqrtbf16 ymm22 {k7} {z}, ymm23
// CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4e,0xf7]
- vrsqrtpbf16 ymm22 {k7} {z}, ymm23
+ vrsqrtbf16 ymm22 {k7} {z}, ymm23
-// CHECK: vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+ vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+ vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vrsqrtpbf16 xmm22, word ptr [rip]{1to8}
+// CHECK: vrsqrtbf16 xmm22, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 xmm22, word ptr [rip]{1to8}
+ vrsqrtbf16 xmm22, word ptr [rip]{1to8}
-// CHECK: vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512]
+// CHECK: vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512]
+ vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
-// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+// CHECK: vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f]
- vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+ vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
-// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+// CHECK: vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80]
- vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+ vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
-// CHECK: vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+ vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+ vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vrsqrtpbf16 ymm22, word ptr [rip]{1to16}
+// CHECK: vrsqrtbf16 ymm22, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 ymm22, word ptr [rip]{1to16}
+ vrsqrtbf16 ymm22, word ptr [rip]{1to16}
-// CHECK: vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024]
+// CHECK: vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024]
+ vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
-// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+// CHECK: vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f]
- vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+ vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
-// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+// CHECK: vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80]
- vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+ vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
-// CHECK: vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+ vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00]
- vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+ vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vrsqrtpbf16 zmm22, word ptr [rip]{1to32}
+// CHECK: vrsqrtbf16 zmm22, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00]
- vrsqrtpbf16 zmm22, word ptr [rip]{1to32}
+ vrsqrtbf16 zmm22, word ptr [rip]{1to32}
-// CHECK: vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048]
+// CHECK: vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048]
+ vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
-// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+// CHECK: vrsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f]
- vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+ vrsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
-// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+// CHECK: vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80]
- vrsqrtpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+ vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
-// CHECK: vscalefpbf16 ymm22, ymm23, ymm24
+// CHECK: vscalefbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x20,0x2c,0xf0]
- vscalefpbf16 ymm22, ymm23, ymm24
+ vscalefbf16 ymm22, ymm23, ymm24
-// CHECK: vscalefpbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vscalefbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0x27,0x2c,0xf0]
- vscalefpbf16 ymm22 {k7}, ymm23, ymm24
+ vscalefbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x86,0x44,0xa7,0x2c,0xf0]
- vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vscalefpbf16 zmm22, zmm23, zmm24
+// CHECK: vscalefbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x40,0x2c,0xf0]
- vscalefpbf16 zmm22, zmm23, zmm24
+ vscalefbf16 zmm22, zmm23, zmm24
-// CHECK: vscalefpbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vscalefbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0x47,0x2c,0xf0]
- vscalefpbf16 zmm22 {k7}, zmm23, zmm24
+ vscalefbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x86,0x44,0xc7,0x2c,0xf0]
- vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vscalefpbf16 xmm22, xmm23, xmm24
+// CHECK: vscalefbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x00,0x2c,0xf0]
- vscalefpbf16 xmm22, xmm23, xmm24
+ vscalefbf16 xmm22, xmm23, xmm24
-// CHECK: vscalefpbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vscalefbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x2c,0xf0]
- vscalefpbf16 xmm22 {k7}, xmm23, xmm24
+ vscalefbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x86,0x44,0x87,0x2c,0xf0]
- vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f]
- vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vscalefbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80]
- vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f]
- vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80]
- vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vscalefbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vscalefbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00]
- vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f]
- vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe6,0x44,0x97,0x2c,0x72,0x80]
- vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
-// CHECK: vsqrtnepbf16 xmm22, xmm23
+// CHECK: vsqrtbf16 xmm22, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xf7]
- vsqrtnepbf16 xmm22, xmm23
+ vsqrtbf16 xmm22, xmm23
-// CHECK: vsqrtnepbf16 xmm22 {k7}, xmm23
+// CHECK: vsqrtbf16 xmm22 {k7}, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x51,0xf7]
- vsqrtnepbf16 xmm22 {k7}, xmm23
+ vsqrtbf16 xmm22 {k7}, xmm23
-// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, xmm23
+// CHECK: vsqrtbf16 xmm22 {k7} {z}, xmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x51,0xf7]
- vsqrtnepbf16 xmm22 {k7} {z}, xmm23
+ vsqrtbf16 xmm22 {k7} {z}, xmm23
-// CHECK: vsqrtnepbf16 zmm22, zmm23
+// CHECK: vsqrtbf16 zmm22, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xf7]
- vsqrtnepbf16 zmm22, zmm23
+ vsqrtbf16 zmm22, zmm23
-// CHECK: vsqrtnepbf16 zmm22 {k7}, zmm23
+// CHECK: vsqrtbf16 zmm22 {k7}, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x51,0xf7]
- vsqrtnepbf16 zmm22 {k7}, zmm23
+ vsqrtbf16 zmm22 {k7}, zmm23
-// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, zmm23
+// CHECK: vsqrtbf16 zmm22 {k7} {z}, zmm23
// CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x51,0xf7]
- vsqrtnepbf16 zmm22 {k7} {z}, zmm23
+ vsqrtbf16 zmm22 {k7} {z}, zmm23
-// CHECK: vsqrtnepbf16 ymm22, ymm23
+// CHECK: vsqrtbf16 ymm22, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xf7]
- vsqrtnepbf16 ymm22, ymm23
+ vsqrtbf16 ymm22, ymm23
-// CHECK: vsqrtnepbf16 ymm22 {k7}, ymm23
+// CHECK: vsqrtbf16 ymm22 {k7}, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x51,0xf7]
- vsqrtnepbf16 ymm22 {k7}, ymm23
+ vsqrtbf16 ymm22 {k7}, ymm23
-// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, ymm23
+// CHECK: vsqrtbf16 ymm22 {k7} {z}, ymm23
// CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x51,0xf7]
- vsqrtnepbf16 ymm22 {k7} {z}, ymm23
+ vsqrtbf16 ymm22 {k7} {z}, ymm23
-// CHECK: vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
+ vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
+ vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vsqrtnepbf16 xmm22, word ptr [rip]{1to8}
+// CHECK: vsqrtbf16 xmm22, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 xmm22, word ptr [rip]{1to8}
+ vsqrtbf16 xmm22, word ptr [rip]{1to8}
-// CHECK: vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512]
+// CHECK: vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512]
+ vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512]
-// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+// CHECK: vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f]
- vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
+ vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032]
-// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+// CHECK: vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80]
- vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
+ vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}
-// CHECK: vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
+ vsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
+ vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vsqrtnepbf16 ymm22, word ptr [rip]{1to16}
+// CHECK: vsqrtbf16 ymm22, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 ymm22, word ptr [rip]{1to16}
+ vsqrtbf16 ymm22, word ptr [rip]{1to16}
-// CHECK: vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024]
+// CHECK: vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024]
+ vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024]
-// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+// CHECK: vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f]
- vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
+ vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064]
-// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+// CHECK: vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80]
- vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
+ vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}
-// CHECK: vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
+ vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
+ vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vsqrtnepbf16 zmm22, word ptr [rip]{1to32}
+// CHECK: vsqrtbf16 zmm22, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00]
- vsqrtnepbf16 zmm22, word ptr [rip]{1to32}
+ vsqrtbf16 zmm22, word ptr [rip]{1to32}
-// CHECK: vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048]
+// CHECK: vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048]
+ vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048]
-// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+// CHECK: vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f]
- vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
+ vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128]
-// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+// CHECK: vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80]
- vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
+ vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}
-// CHECK: vsubnepbf16 ymm22, ymm23, ymm24
+// CHECK: vsubbf16 ymm22, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x20,0x5c,0xf0]
- vsubnepbf16 ymm22, ymm23, ymm24
+ vsubbf16 ymm22, ymm23, ymm24
-// CHECK: vsubnepbf16 ymm22 {k7}, ymm23, ymm24
+// CHECK: vsubbf16 ymm22 {k7}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0x27,0x5c,0xf0]
- vsubnepbf16 ymm22 {k7}, ymm23, ymm24
+ vsubbf16 ymm22 {k7}, ymm23, ymm24
-// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, ymm24
// CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5c,0xf0]
- vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24
+ vsubbf16 ymm22 {k7} {z}, ymm23, ymm24
-// CHECK: vsubnepbf16 zmm22, zmm23, zmm24
+// CHECK: vsubbf16 zmm22, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x40,0x5c,0xf0]
- vsubnepbf16 zmm22, zmm23, zmm24
+ vsubbf16 zmm22, zmm23, zmm24
-// CHECK: vsubnepbf16 zmm22 {k7}, zmm23, zmm24
+// CHECK: vsubbf16 zmm22 {k7}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0x47,0x5c,0xf0]
- vsubnepbf16 zmm22 {k7}, zmm23, zmm24
+ vsubbf16 zmm22 {k7}, zmm23, zmm24
-// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, zmm24
// CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5c,0xf0]
- vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24
+ vsubbf16 zmm22 {k7} {z}, zmm23, zmm24
-// CHECK: vsubnepbf16 xmm22, xmm23, xmm24
+// CHECK: vsubbf16 xmm22, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x00,0x5c,0xf0]
- vsubnepbf16 xmm22, xmm23, xmm24
+ vsubbf16 xmm22, xmm23, xmm24
-// CHECK: vsubnepbf16 xmm22 {k7}, xmm23, xmm24
+// CHECK: vsubbf16 xmm22 {k7}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x07,0x5c,0xf0]
- vsubnepbf16 xmm22 {k7}, xmm23, xmm24
+ vsubbf16 xmm22 {k7}, xmm23, xmm24
-// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, xmm24
// CHECK: encoding: [0x62,0x85,0x45,0x87,0x5c,0xf0]
- vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24
+ vsubbf16 xmm22 {k7} {z}, xmm23, xmm24
-// CHECK: vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
+ vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+// CHECK: vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
+ vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291]
-// CHECK: vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+// CHECK: vsubbf16 zmm22, zmm23, word ptr [rip]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32}
+ vsubbf16 zmm22, zmm23, word ptr [rip]{1to32}
-// CHECK: vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+// CHECK: vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
// CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff]
- vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
+ vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048]
-// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
// CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f]
- vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
+ vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128]
-// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
// CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80]
- vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
+ vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32}
-// CHECK: vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
+ vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+// CHECK: vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
+ vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291]
-// CHECK: vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+// CHECK: vsubbf16 ymm22, ymm23, word ptr [rip]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16}
+ vsubbf16 ymm22, ymm23, word ptr [rip]{1to16}
-// CHECK: vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+// CHECK: vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
// CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff]
- vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
+ vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024]
-// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
// CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f]
- vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
+ vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064]
-// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
// CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80]
- vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
+ vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16}
-// CHECK: vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+// CHECK: vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10]
- vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
+ vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456]
-// CHECK: vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+// CHECK: vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
// CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00]
- vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
+ vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291]
-// CHECK: vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+// CHECK: vsubbf16 xmm22, xmm23, word ptr [rip]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00]
- vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8}
+ vsubbf16 xmm22, xmm23, word ptr [rip]{1to8}
-// CHECK: vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+// CHECK: vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
// CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff]
- vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
+ vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512]
-// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
// CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f]
- vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
+ vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032]
-// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
// CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5c,0x72,0x80]
- vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
+ vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8}
diff --git a/llvm/test/TableGen/x86-fold-tables.inc b/llvm/test/TableGen/x86-fold-tables.inc
index 954c05bdb20767..f2a3ba854c1270 100644
--- a/llvm/test/TableGen/x86-fold-tables.inc
+++ b/llvm/test/TableGen/x86-fold-tables.inc
@@ -1506,9 +1506,9 @@ static const X86FoldTableEntry Table1[] = {
{X86::VEXPANDPSZ128rr, X86::VEXPANDPSZ128rm, TB_NO_REVERSE},
{X86::VEXPANDPSZ256rr, X86::VEXPANDPSZ256rm, TB_NO_REVERSE},
{X86::VEXPANDPSZrr, X86::VEXPANDPSZrm, TB_NO_REVERSE},
- {X86::VFPCLASSPBF16Z128ri, X86::VFPCLASSPBF16Z128mi, 0},
- {X86::VFPCLASSPBF16Z256ri, X86::VFPCLASSPBF16Z256mi, 0},
- {X86::VFPCLASSPBF16Zri, X86::VFPCLASSPBF16Zmi, 0},
+ {X86::VFPCLASSBF16Z128ri, X86::VFPCLASSBF16Z128mi, 0},
+ {X86::VFPCLASSBF16Z256ri, X86::VFPCLASSBF16Z256mi, 0},
+ {X86::VFPCLASSBF16Zri, X86::VFPCLASSBF16Zmi, 0},
{X86::VFPCLASSPDZ128ri, X86::VFPCLASSPDZ128mi, 0},
{X86::VFPCLASSPDZ256ri, X86::VFPCLASSPDZ256mi, 0},
{X86::VFPCLASSPDZri, X86::VFPCLASSPDZmi, 0},
@@ -1527,9 +1527,9 @@ static const X86FoldTableEntry Table1[] = {
{X86::VFRCZPSrr, X86::VFRCZPSrm, 0},
{X86::VFRCZSDrr, X86::VFRCZSDrm, TB_NO_REVERSE},
{X86::VFRCZSSrr, X86::VFRCZSSrm, TB_NO_REVERSE},
- {X86::VGETEXPPBF16Z128r, X86::VGETEXPPBF16Z128m, 0},
- {X86::VGETEXPPBF16Z256r, X86::VGETEXPPBF16Z256m, 0},
- {X86::VGETEXPPBF16Zr, X86::VGETEXPPBF16Zm, 0},
+ {X86::VGETEXPBF16Z128r, X86::VGETEXPBF16Z128m, 0},
+ {X86::VGETEXPBF16Z256r, X86::VGETEXPBF16Z256m, 0},
+ {X86::VGETEXPBF16Zr, X86::VGETEXPBF16Zm, 0},
{X86::VGETEXPPDZ128r, X86::VGETEXPPDZ128m, 0},
{X86::VGETEXPPDZ256r, X86::VGETEXPPDZ256m, 0},
{X86::VGETEXPPDZr, X86::VGETEXPPDZm, 0},
@@ -1539,9 +1539,9 @@ static const X86FoldTableEntry Table1[] = {
{X86::VGETEXPPSZ128r, X86::VGETEXPPSZ128m, 0},
{X86::VGETEXPPSZ256r, X86::VGETEXPPSZ256m, 0},
{X86::VGETEXPPSZr, X86::VGETEXPPSZm, 0},
- {X86::VGETMANTPBF16Z128rri, X86::VGETMANTPBF16Z128rmi, 0},
- {X86::VGETMANTPBF16Z256rri, X86::VGETMANTPBF16Z256rmi, 0},
- {X86::VGETMANTPBF16Zrri, X86::VGETMANTPBF16Zrmi, 0},
+ {X86::VGETMANTBF16Z128rri, X86::VGETMANTBF16Z128rmi, 0},
+ {X86::VGETMANTBF16Z256rri, X86::VGETMANTBF16Z256rmi, 0},
+ {X86::VGETMANTBF16Zrri, X86::VGETMANTBF16Zrmi, 0},
{X86::VGETMANTPDZ128rri, X86::VGETMANTPDZ128rmi, 0},
{X86::VGETMANTPDZ256rri, X86::VGETMANTPDZ256rmi, 0},
{X86::VGETMANTPDZrri, X86::VGETMANTPDZrmi, 0},
@@ -1877,17 +1877,17 @@ static const X86FoldTableEntry Table1[] = {
{X86::VRCP14PSZr, X86::VRCP14PSZm, 0},
{X86::VRCP28PDZr, X86::VRCP28PDZm, 0},
{X86::VRCP28PSZr, X86::VRCP28PSZm, 0},
- {X86::VRCPPBF16Z128r, X86::VRCPPBF16Z128m, 0},
- {X86::VRCPPBF16Z256r, X86::VRCPPBF16Z256m, 0},
- {X86::VRCPPBF16Zr, X86::VRCPPBF16Zm, 0},
+ {X86::VRCPBF16Z128r, X86::VRCPBF16Z128m, 0},
+ {X86::VRCPBF16Z256r, X86::VRCPBF16Z256m, 0},
+ {X86::VRCPBF16Zr, X86::VRCPBF16Zm, 0},
{X86::VRCPPHZ128r, X86::VRCPPHZ128m, 0},
{X86::VRCPPHZ256r, X86::VRCPPHZ256m, 0},
{X86::VRCPPHZr, X86::VRCPPHZm, 0},
{X86::VRCPPSYr, X86::VRCPPSYm, 0},
{X86::VRCPPSr, X86::VRCPPSm, 0},
- {X86::VREDUCENEPBF16Z128rri, X86::VREDUCENEPBF16Z128rmi, 0},
- {X86::VREDUCENEPBF16Z256rri, X86::VREDUCENEPBF16Z256rmi, 0},
- {X86::VREDUCENEPBF16Zrri, X86::VREDUCENEPBF16Zrmi, 0},
+ {X86::VREDUCEBF16Z128rri, X86::VREDUCEBF16Z128rmi, 0},
+ {X86::VREDUCEBF16Z256rri, X86::VREDUCEBF16Z256rmi, 0},
+ {X86::VREDUCEBF16Zrri, X86::VREDUCEBF16Zrmi, 0},
{X86::VREDUCEPDZ128rri, X86::VREDUCEPDZ128rmi, 0},
{X86::VREDUCEPDZ256rri, X86::VREDUCEPDZ256rmi, 0},
{X86::VREDUCEPDZrri, X86::VREDUCEPDZrmi, 0},
@@ -1897,9 +1897,9 @@ static const X86FoldTableEntry Table1[] = {
{X86::VREDUCEPSZ128rri, X86::VREDUCEPSZ128rmi, 0},
{X86::VREDUCEPSZ256rri, X86::VREDUCEPSZ256rmi, 0},
{X86::VREDUCEPSZrri, X86::VREDUCEPSZrmi, 0},
- {X86::VRNDSCALENEPBF16Z128rri, X86::VRNDSCALENEPBF16Z128rmi, 0},
- {X86::VRNDSCALENEPBF16Z256rri, X86::VRNDSCALENEPBF16Z256rmi, 0},
- {X86::VRNDSCALENEPBF16Zrri, X86::VRNDSCALENEPBF16Zrmi, 0},
+ {X86::VRNDSCALEBF16Z128rri, X86::VRNDSCALEBF16Z128rmi, 0},
+ {X86::VRNDSCALEBF16Z256rri, X86::VRNDSCALEBF16Z256rmi, 0},
+ {X86::VRNDSCALEBF16Zrri, X86::VRNDSCALEBF16Zrmi, 0},
{X86::VRNDSCALEPDZ128rri, X86::VRNDSCALEPDZ128rmi, 0},
{X86::VRNDSCALEPDZ256rri, X86::VRNDSCALEPDZ256rmi, 0},
{X86::VRNDSCALEPDZrri, X86::VRNDSCALEPDZrmi, 0},
@@ -1921,17 +1921,17 @@ static const X86FoldTableEntry Table1[] = {
{X86::VRSQRT14PSZr, X86::VRSQRT14PSZm, 0},
{X86::VRSQRT28PDZr, X86::VRSQRT28PDZm, 0},
{X86::VRSQRT28PSZr, X86::VRSQRT28PSZm, 0},
- {X86::VRSQRTPBF16Z128r, X86::VRSQRTPBF16Z128m, 0},
- {X86::VRSQRTPBF16Z256r, X86::VRSQRTPBF16Z256m, 0},
- {X86::VRSQRTPBF16Zr, X86::VRSQRTPBF16Zm, 0},
+ {X86::VRSQRTBF16Z128r, X86::VRSQRTBF16Z128m, 0},
+ {X86::VRSQRTBF16Z256r, X86::VRSQRTBF16Z256m, 0},
+ {X86::VRSQRTBF16Zr, X86::VRSQRTBF16Zm, 0},
{X86::VRSQRTPHZ128r, X86::VRSQRTPHZ128m, 0},
{X86::VRSQRTPHZ256r, X86::VRSQRTPHZ256m, 0},
{X86::VRSQRTPHZr, X86::VRSQRTPHZm, 0},
{X86::VRSQRTPSYr, X86::VRSQRTPSYm, 0},
{X86::VRSQRTPSr, X86::VRSQRTPSm, 0},
- {X86::VSQRTNEPBF16Z128r, X86::VSQRTNEPBF16Z128m, 0},
- {X86::VSQRTNEPBF16Z256r, X86::VSQRTNEPBF16Z256m, 0},
- {X86::VSQRTNEPBF16Zr, X86::VSQRTNEPBF16Zm, 0},
+ {X86::VSQRTBF16Z128r, X86::VSQRTBF16Z128m, 0},
+ {X86::VSQRTBF16Z256r, X86::VSQRTBF16Z256m, 0},
+ {X86::VSQRTBF16Zr, X86::VSQRTBF16Zm, 0},
{X86::VSQRTPDYr, X86::VSQRTPDYm, 0},
{X86::VSQRTPDZ128r, X86::VSQRTPDZ128m, 0},
{X86::VSQRTPDZ256r, X86::VSQRTPDZ256m, 0},
@@ -2412,9 +2412,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::UNPCKHPSrr, X86::UNPCKHPSrm, TB_ALIGN_16},
{X86::UNPCKLPDrr, X86::UNPCKLPDrm, TB_ALIGN_16},
{X86::UNPCKLPSrr, X86::UNPCKLPSrm, TB_ALIGN_16},
- {X86::VADDNEPBF16Z128rr, X86::VADDNEPBF16Z128rm, 0},
- {X86::VADDNEPBF16Z256rr, X86::VADDNEPBF16Z256rm, 0},
- {X86::VADDNEPBF16Zrr, X86::VADDNEPBF16Zrm, 0},
+ {X86::VADDBF16Z128rr, X86::VADDBF16Z128rm, 0},
+ {X86::VADDBF16Z256rr, X86::VADDBF16Z256rm, 0},
+ {X86::VADDBF16Zrr, X86::VADDBF16Zrm, 0},
{X86::VADDPDYrr, X86::VADDPDYrm, 0},
{X86::VADDPDZ128rr, X86::VADDPDZ128rm, 0},
{X86::VADDPDZ256rr, X86::VADDPDZ256rm, 0},
@@ -2512,9 +2512,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VBROADCASTSSZ128rrkz, X86::VBROADCASTSSZ128rmkz, TB_NO_REVERSE},
{X86::VBROADCASTSSZ256rrkz, X86::VBROADCASTSSZ256rmkz, TB_NO_REVERSE},
{X86::VBROADCASTSSZrrkz, X86::VBROADCASTSSZrmkz, TB_NO_REVERSE},
- {X86::VCMPPBF16Z128rri, X86::VCMPPBF16Z128rmi, 0},
- {X86::VCMPPBF16Z256rri, X86::VCMPPBF16Z256rmi, 0},
- {X86::VCMPPBF16Zrri, X86::VCMPPBF16Zrmi, 0},
+ {X86::VCMPBF16Z128rri, X86::VCMPBF16Z128rmi, 0},
+ {X86::VCMPBF16Z256rri, X86::VCMPBF16Z256rmi, 0},
+ {X86::VCMPBF16Zrri, X86::VCMPBF16Zrmi, 0},
{X86::VCMPPDYrri, X86::VCMPPDYrmi, 0},
{X86::VCMPPDZ128rri, X86::VCMPPDZ128rmi, 0},
{X86::VCMPPDZ256rri, X86::VCMPPDZ256rmi, 0},
@@ -2844,9 +2844,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VDBPSADBWZ128rri, X86::VDBPSADBWZ128rmi, 0},
{X86::VDBPSADBWZ256rri, X86::VDBPSADBWZ256rmi, 0},
{X86::VDBPSADBWZrri, X86::VDBPSADBWZrmi, 0},
- {X86::VDIVNEPBF16Z128rr, X86::VDIVNEPBF16Z128rm, 0},
- {X86::VDIVNEPBF16Z256rr, X86::VDIVNEPBF16Z256rm, 0},
- {X86::VDIVNEPBF16Zrr, X86::VDIVNEPBF16Zrm, 0},
+ {X86::VDIVBF16Z128rr, X86::VDIVBF16Z128rm, 0},
+ {X86::VDIVBF16Z256rr, X86::VDIVBF16Z256rm, 0},
+ {X86::VDIVBF16Zrr, X86::VDIVBF16Zrm, 0},
{X86::VDIVPDYrr, X86::VDIVPDYrm, 0},
{X86::VDIVPDZ128rr, X86::VDIVPDZ128rm, 0},
{X86::VDIVPDZ256rr, X86::VDIVPDZ256rm, 0},
@@ -2929,9 +2929,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VFNMSUBSD4rr_Int, X86::VFNMSUBSD4mr_Int, TB_NO_REVERSE},
{X86::VFNMSUBSS4rr, X86::VFNMSUBSS4mr, 0},
{X86::VFNMSUBSS4rr_Int, X86::VFNMSUBSS4mr_Int, TB_NO_REVERSE},
- {X86::VFPCLASSPBF16Z128rik, X86::VFPCLASSPBF16Z128mik, 0},
- {X86::VFPCLASSPBF16Z256rik, X86::VFPCLASSPBF16Z256mik, 0},
- {X86::VFPCLASSPBF16Zrik, X86::VFPCLASSPBF16Zmik, 0},
+ {X86::VFPCLASSBF16Z128rik, X86::VFPCLASSBF16Z128mik, 0},
+ {X86::VFPCLASSBF16Z256rik, X86::VFPCLASSBF16Z256mik, 0},
+ {X86::VFPCLASSBF16Zrik, X86::VFPCLASSBF16Zmik, 0},
{X86::VFPCLASSPDZ128rik, X86::VFPCLASSPDZ128mik, 0},
{X86::VFPCLASSPDZ256rik, X86::VFPCLASSPDZ256mik, 0},
{X86::VFPCLASSPDZrik, X86::VFPCLASSPDZmik, 0},
@@ -2944,9 +2944,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VFPCLASSSDZrik, X86::VFPCLASSSDZmik, TB_NO_REVERSE},
{X86::VFPCLASSSHZrik, X86::VFPCLASSSHZmik, TB_NO_REVERSE},
{X86::VFPCLASSSSZrik, X86::VFPCLASSSSZmik, TB_NO_REVERSE},
- {X86::VGETEXPPBF16Z128rkz, X86::VGETEXPPBF16Z128mkz, 0},
- {X86::VGETEXPPBF16Z256rkz, X86::VGETEXPPBF16Z256mkz, 0},
- {X86::VGETEXPPBF16Zrkz, X86::VGETEXPPBF16Zmkz, 0},
+ {X86::VGETEXPBF16Z128rkz, X86::VGETEXPBF16Z128mkz, 0},
+ {X86::VGETEXPBF16Z256rkz, X86::VGETEXPBF16Z256mkz, 0},
+ {X86::VGETEXPBF16Zrkz, X86::VGETEXPBF16Zmkz, 0},
{X86::VGETEXPPDZ128rkz, X86::VGETEXPPDZ128mkz, 0},
{X86::VGETEXPPDZ256rkz, X86::VGETEXPPDZ256mkz, 0},
{X86::VGETEXPPDZrkz, X86::VGETEXPPDZmkz, 0},
@@ -2959,9 +2959,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VGETEXPSDZr, X86::VGETEXPSDZm, TB_NO_REVERSE},
{X86::VGETEXPSHZr, X86::VGETEXPSHZm, TB_NO_REVERSE},
{X86::VGETEXPSSZr, X86::VGETEXPSSZm, TB_NO_REVERSE},
- {X86::VGETMANTPBF16Z128rrikz, X86::VGETMANTPBF16Z128rmikz, 0},
- {X86::VGETMANTPBF16Z256rrikz, X86::VGETMANTPBF16Z256rmikz, 0},
- {X86::VGETMANTPBF16Zrrikz, X86::VGETMANTPBF16Zrmikz, 0},
+ {X86::VGETMANTBF16Z128rrikz, X86::VGETMANTBF16Z128rmikz, 0},
+ {X86::VGETMANTBF16Z256rrikz, X86::VGETMANTBF16Z256rmikz, 0},
+ {X86::VGETMANTBF16Zrrikz, X86::VGETMANTBF16Zrmikz, 0},
{X86::VGETMANTPDZ128rrikz, X86::VGETMANTPDZ128rmikz, 0},
{X86::VGETMANTPDZ256rrikz, X86::VGETMANTPDZ256rmikz, 0},
{X86::VGETMANTPDZrrikz, X86::VGETMANTPDZrmikz, 0},
@@ -3011,6 +3011,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VINSERTI64X2Z256rri, X86::VINSERTI64X2Z256rmi, 0},
{X86::VINSERTI64X2Zrri, X86::VINSERTI64X2Zrmi, 0},
{X86::VINSERTI64X4Zrri, X86::VINSERTI64X4Zrmi, 0},
+ {X86::VMAXBF16Z128rr, X86::VMAXBF16Z128rm, 0},
+ {X86::VMAXBF16Z256rr, X86::VMAXBF16Z256rm, 0},
+ {X86::VMAXBF16Zrr, X86::VMAXBF16Zrm, 0},
{X86::VMAXCPDYrr, X86::VMAXCPDYrm, 0},
{X86::VMAXCPDZ128rr, X86::VMAXCPDZ128rm, 0},
{X86::VMAXCPDZ256rr, X86::VMAXCPDZ256rm, 0},
@@ -3029,9 +3032,6 @@ static const X86FoldTableEntry Table2[] = {
{X86::VMAXCSHZrr, X86::VMAXCSHZrm, 0},
{X86::VMAXCSSZrr, X86::VMAXCSSZrm, 0},
{X86::VMAXCSSrr, X86::VMAXCSSrm, 0},
- {X86::VMAXPBF16Z128rr, X86::VMAXPBF16Z128rm, 0},
- {X86::VMAXPBF16Z256rr, X86::VMAXPBF16Z256rm, 0},
- {X86::VMAXPBF16Zrr, X86::VMAXPBF16Zrm, 0},
{X86::VMAXPDYrr, X86::VMAXPDYrm, 0},
{X86::VMAXPDZ128rr, X86::VMAXPDZ128rm, 0},
{X86::VMAXPDZ256rr, X86::VMAXPDZ256rm, 0},
@@ -3055,6 +3055,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VMAXSSZrr_Int, X86::VMAXSSZrm_Int, TB_NO_REVERSE},
{X86::VMAXSSrr, X86::VMAXSSrm, 0},
{X86::VMAXSSrr_Int, X86::VMAXSSrm_Int, TB_NO_REVERSE},
+ {X86::VMINBF16Z128rr, X86::VMINBF16Z128rm, 0},
+ {X86::VMINBF16Z256rr, X86::VMINBF16Z256rm, 0},
+ {X86::VMINBF16Zrr, X86::VMINBF16Zrm, 0},
{X86::VMINCPDYrr, X86::VMINCPDYrm, 0},
{X86::VMINCPDZ128rr, X86::VMINCPDZ128rm, 0},
{X86::VMINCPDZ256rr, X86::VMINCPDZ256rm, 0},
@@ -3091,9 +3094,6 @@ static const X86FoldTableEntry Table2[] = {
{X86::VMINMAXSHrri_Int, X86::VMINMAXSHrmi_Int, TB_NO_REVERSE},
{X86::VMINMAXSSrri, X86::VMINMAXSSrmi, 0},
{X86::VMINMAXSSrri_Int, X86::VMINMAXSSrmi_Int, TB_NO_REVERSE},
- {X86::VMINPBF16Z128rr, X86::VMINPBF16Z128rm, 0},
- {X86::VMINPBF16Z256rr, X86::VMINPBF16Z256rm, 0},
- {X86::VMINPBF16Zrr, X86::VMINPBF16Zrm, 0},
{X86::VMINPDYrr, X86::VMINPDYrm, 0},
{X86::VMINPDZ128rr, X86::VMINPDZ128rm, 0},
{X86::VMINPDZ256rr, X86::VMINPDZ256rm, 0},
@@ -3165,9 +3165,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VMPSADBWZ256rri, X86::VMPSADBWZ256rmi, 0},
{X86::VMPSADBWZrri, X86::VMPSADBWZrmi, 0},
{X86::VMPSADBWrri, X86::VMPSADBWrmi, 0},
- {X86::VMULNEPBF16Z128rr, X86::VMULNEPBF16Z128rm, 0},
- {X86::VMULNEPBF16Z256rr, X86::VMULNEPBF16Z256rm, 0},
- {X86::VMULNEPBF16Zrr, X86::VMULNEPBF16Zrm, 0},
+ {X86::VMULBF16Z128rr, X86::VMULBF16Z128rm, 0},
+ {X86::VMULBF16Z256rr, X86::VMULBF16Z256rm, 0},
+ {X86::VMULBF16Zrr, X86::VMULBF16Zrm, 0},
{X86::VMULPDYrr, X86::VMULPDYrm, 0},
{X86::VMULPDZ128rr, X86::VMULPDZ128rm, 0},
{X86::VMULPDZ256rr, X86::VMULPDZ256rm, 0},
@@ -4018,18 +4018,18 @@ static const X86FoldTableEntry Table2[] = {
{X86::VRCP28PSZrkz, X86::VRCP28PSZmkz, 0},
{X86::VRCP28SDZr, X86::VRCP28SDZm, TB_NO_REVERSE},
{X86::VRCP28SSZr, X86::VRCP28SSZm, TB_NO_REVERSE},
- {X86::VRCPPBF16Z128rkz, X86::VRCPPBF16Z128mkz, 0},
- {X86::VRCPPBF16Z256rkz, X86::VRCPPBF16Z256mkz, 0},
- {X86::VRCPPBF16Zrkz, X86::VRCPPBF16Zmkz, 0},
+ {X86::VRCPBF16Z128rkz, X86::VRCPBF16Z128mkz, 0},
+ {X86::VRCPBF16Z256rkz, X86::VRCPBF16Z256mkz, 0},
+ {X86::VRCPBF16Zrkz, X86::VRCPBF16Zmkz, 0},
{X86::VRCPPHZ128rkz, X86::VRCPPHZ128mkz, 0},
{X86::VRCPPHZ256rkz, X86::VRCPPHZ256mkz, 0},
{X86::VRCPPHZrkz, X86::VRCPPHZmkz, 0},
{X86::VRCPSHZrr, X86::VRCPSHZrm, TB_NO_REVERSE},
{X86::VRCPSSr, X86::VRCPSSm, 0},
{X86::VRCPSSr_Int, X86::VRCPSSm_Int, TB_NO_REVERSE},
- {X86::VREDUCENEPBF16Z128rrikz, X86::VREDUCENEPBF16Z128rmikz, 0},
- {X86::VREDUCENEPBF16Z256rrikz, X86::VREDUCENEPBF16Z256rmikz, 0},
- {X86::VREDUCENEPBF16Zrrikz, X86::VREDUCENEPBF16Zrmikz, 0},
+ {X86::VREDUCEBF16Z128rrikz, X86::VREDUCEBF16Z128rmikz, 0},
+ {X86::VREDUCEBF16Z256rrikz, X86::VREDUCEBF16Z256rmikz, 0},
+ {X86::VREDUCEBF16Zrrikz, X86::VREDUCEBF16Zrmikz, 0},
{X86::VREDUCEPDZ128rrikz, X86::VREDUCEPDZ128rmikz, 0},
{X86::VREDUCEPDZ256rrikz, X86::VREDUCEPDZ256rmikz, 0},
{X86::VREDUCEPDZrrikz, X86::VREDUCEPDZrmikz, 0},
@@ -4042,9 +4042,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VREDUCESDZrri, X86::VREDUCESDZrmi, TB_NO_REVERSE},
{X86::VREDUCESHZrri, X86::VREDUCESHZrmi, TB_NO_REVERSE},
{X86::VREDUCESSZrri, X86::VREDUCESSZrmi, TB_NO_REVERSE},
- {X86::VRNDSCALENEPBF16Z128rrikz, X86::VRNDSCALENEPBF16Z128rmikz, 0},
- {X86::VRNDSCALENEPBF16Z256rrikz, X86::VRNDSCALENEPBF16Z256rmikz, 0},
- {X86::VRNDSCALENEPBF16Zrrikz, X86::VRNDSCALENEPBF16Zrmikz, 0},
+ {X86::VRNDSCALEBF16Z128rrikz, X86::VRNDSCALEBF16Z128rmikz, 0},
+ {X86::VRNDSCALEBF16Z256rrikz, X86::VRNDSCALEBF16Z256rmikz, 0},
+ {X86::VRNDSCALEBF16Zrrikz, X86::VRNDSCALEBF16Zrmikz, 0},
{X86::VRNDSCALEPDZ128rrikz, X86::VRNDSCALEPDZ128rmikz, 0},
{X86::VRNDSCALEPDZ256rrikz, X86::VRNDSCALEPDZ256rmikz, 0},
{X86::VRNDSCALEPDZrrikz, X86::VRNDSCALEPDZrmikz, 0},
@@ -4076,18 +4076,18 @@ static const X86FoldTableEntry Table2[] = {
{X86::VRSQRT28PSZrkz, X86::VRSQRT28PSZmkz, 0},
{X86::VRSQRT28SDZr, X86::VRSQRT28SDZm, TB_NO_REVERSE},
{X86::VRSQRT28SSZr, X86::VRSQRT28SSZm, TB_NO_REVERSE},
- {X86::VRSQRTPBF16Z128rkz, X86::VRSQRTPBF16Z128mkz, 0},
- {X86::VRSQRTPBF16Z256rkz, X86::VRSQRTPBF16Z256mkz, 0},
- {X86::VRSQRTPBF16Zrkz, X86::VRSQRTPBF16Zmkz, 0},
+ {X86::VRSQRTBF16Z128rkz, X86::VRSQRTBF16Z128mkz, 0},
+ {X86::VRSQRTBF16Z256rkz, X86::VRSQRTBF16Z256mkz, 0},
+ {X86::VRSQRTBF16Zrkz, X86::VRSQRTBF16Zmkz, 0},
{X86::VRSQRTPHZ128rkz, X86::VRSQRTPHZ128mkz, 0},
{X86::VRSQRTPHZ256rkz, X86::VRSQRTPHZ256mkz, 0},
{X86::VRSQRTPHZrkz, X86::VRSQRTPHZmkz, 0},
{X86::VRSQRTSHZrr, X86::VRSQRTSHZrm, TB_NO_REVERSE},
{X86::VRSQRTSSr, X86::VRSQRTSSm, 0},
{X86::VRSQRTSSr_Int, X86::VRSQRTSSm_Int, TB_NO_REVERSE},
- {X86::VSCALEFPBF16Z128rr, X86::VSCALEFPBF16Z128rm, 0},
- {X86::VSCALEFPBF16Z256rr, X86::VSCALEFPBF16Z256rm, 0},
- {X86::VSCALEFPBF16Zrr, X86::VSCALEFPBF16Zrm, 0},
+ {X86::VSCALEFBF16Z128rr, X86::VSCALEFBF16Z128rm, 0},
+ {X86::VSCALEFBF16Z256rr, X86::VSCALEFBF16Z256rm, 0},
+ {X86::VSCALEFBF16Zrr, X86::VSCALEFBF16Zrm, 0},
{X86::VSCALEFPDZ128rr, X86::VSCALEFPDZ128rm, 0},
{X86::VSCALEFPDZ256rr, X86::VSCALEFPDZ256rm, 0},
{X86::VSCALEFPDZrr, X86::VSCALEFPDZrm, 0},
@@ -4128,9 +4128,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VSM4RNDS4Z256rr, X86::VSM4RNDS4Z256rm, 0},
{X86::VSM4RNDS4Zrr, X86::VSM4RNDS4Zrm, 0},
{X86::VSM4RNDS4rr, X86::VSM4RNDS4rm, 0},
- {X86::VSQRTNEPBF16Z128rkz, X86::VSQRTNEPBF16Z128mkz, 0},
- {X86::VSQRTNEPBF16Z256rkz, X86::VSQRTNEPBF16Z256mkz, 0},
- {X86::VSQRTNEPBF16Zrkz, X86::VSQRTNEPBF16Zmkz, 0},
+ {X86::VSQRTBF16Z128rkz, X86::VSQRTBF16Z128mkz, 0},
+ {X86::VSQRTBF16Z256rkz, X86::VSQRTBF16Z256mkz, 0},
+ {X86::VSQRTBF16Zrkz, X86::VSQRTBF16Zmkz, 0},
{X86::VSQRTPDZ128rkz, X86::VSQRTPDZ128mkz, 0},
{X86::VSQRTPDZ256rkz, X86::VSQRTPDZ256mkz, 0},
{X86::VSQRTPDZrkz, X86::VSQRTPDZmkz, 0},
@@ -4150,9 +4150,9 @@ static const X86FoldTableEntry Table2[] = {
{X86::VSQRTSSZr_Int, X86::VSQRTSSZm_Int, TB_NO_REVERSE},
{X86::VSQRTSSr, X86::VSQRTSSm, 0},
{X86::VSQRTSSr_Int, X86::VSQRTSSm_Int, TB_NO_REVERSE},
- {X86::VSUBNEPBF16Z128rr, X86::VSUBNEPBF16Z128rm, 0},
- {X86::VSUBNEPBF16Z256rr, X86::VSUBNEPBF16Z256rm, 0},
- {X86::VSUBNEPBF16Zrr, X86::VSUBNEPBF16Zrm, 0},
+ {X86::VSUBBF16Z128rr, X86::VSUBBF16Z128rm, 0},
+ {X86::VSUBBF16Z256rr, X86::VSUBBF16Z256rm, 0},
+ {X86::VSUBBF16Zrr, X86::VSUBBF16Zrm, 0},
{X86::VSUBPDYrr, X86::VSUBPDYrm, 0},
{X86::VSUBPDZ128rr, X86::VSUBPDZ128rm, 0},
{X86::VSUBPDZ256rr, X86::VSUBPDZ256rm, 0},
@@ -4227,9 +4227,9 @@ static const X86FoldTableEntry Table2[] = {
};
static const X86FoldTableEntry Table3[] = {
- {X86::VADDNEPBF16Z128rrkz, X86::VADDNEPBF16Z128rmkz, 0},
- {X86::VADDNEPBF16Z256rrkz, X86::VADDNEPBF16Z256rmkz, 0},
- {X86::VADDNEPBF16Zrrkz, X86::VADDNEPBF16Zrmkz, 0},
+ {X86::VADDBF16Z128rrkz, X86::VADDBF16Z128rmkz, 0},
+ {X86::VADDBF16Z256rrkz, X86::VADDBF16Z256rmkz, 0},
+ {X86::VADDBF16Zrrkz, X86::VADDBF16Zrmkz, 0},
{X86::VADDPDZ128rrkz, X86::VADDPDZ128rmkz, 0},
{X86::VADDPDZ256rrkz, X86::VADDPDZ256rmkz, 0},
{X86::VADDPDZrrkz, X86::VADDPDZrmkz, 0},
@@ -4276,9 +4276,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VBROADCASTSSZ128rrk, X86::VBROADCASTSSZ128rmk, TB_NO_REVERSE},
{X86::VBROADCASTSSZ256rrk, X86::VBROADCASTSSZ256rmk, TB_NO_REVERSE},
{X86::VBROADCASTSSZrrk, X86::VBROADCASTSSZrmk, TB_NO_REVERSE},
- {X86::VCMPPBF16Z128rrik, X86::VCMPPBF16Z128rmik, 0},
- {X86::VCMPPBF16Z256rrik, X86::VCMPPBF16Z256rmik, 0},
- {X86::VCMPPBF16Zrrik, X86::VCMPPBF16Zrmik, 0},
+ {X86::VCMPBF16Z128rrik, X86::VCMPBF16Z128rmik, 0},
+ {X86::VCMPBF16Z256rrik, X86::VCMPBF16Z256rmik, 0},
+ {X86::VCMPBF16Zrrik, X86::VCMPBF16Zrmik, 0},
{X86::VCMPPDZ128rrik, X86::VCMPPDZ128rmik, 0},
{X86::VCMPPDZ256rrik, X86::VCMPPDZ256rmik, 0},
{X86::VCMPPDZrrik, X86::VCMPPDZrmik, 0},
@@ -4555,9 +4555,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VDBPSADBWZ128rrikz, X86::VDBPSADBWZ128rmikz, 0},
{X86::VDBPSADBWZ256rrikz, X86::VDBPSADBWZ256rmikz, 0},
{X86::VDBPSADBWZrrikz, X86::VDBPSADBWZrmikz, 0},
- {X86::VDIVNEPBF16Z128rrkz, X86::VDIVNEPBF16Z128rmkz, 0},
- {X86::VDIVNEPBF16Z256rrkz, X86::VDIVNEPBF16Z256rmkz, 0},
- {X86::VDIVNEPBF16Zrrkz, X86::VDIVNEPBF16Zrmkz, 0},
+ {X86::VDIVBF16Z128rrkz, X86::VDIVBF16Z128rmkz, 0},
+ {X86::VDIVBF16Z256rrkz, X86::VDIVBF16Z256rmkz, 0},
+ {X86::VDIVBF16Zrrkz, X86::VDIVBF16Zrmkz, 0},
{X86::VDIVPDZ128rrkz, X86::VDIVPDZ128rmkz, 0},
{X86::VDIVPDZ256rrkz, X86::VDIVPDZ256rmkz, 0},
{X86::VDIVPDZrrkz, X86::VDIVPDZrmkz, 0},
@@ -4600,9 +4600,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFIXUPIMMPSZrri, X86::VFIXUPIMMPSZrmi, 0},
{X86::VFIXUPIMMSDZrri, X86::VFIXUPIMMSDZrmi, TB_NO_REVERSE},
{X86::VFIXUPIMMSSZrri, X86::VFIXUPIMMSSZrmi, TB_NO_REVERSE},
- {X86::VFMADD132NEPBF16Z128r, X86::VFMADD132NEPBF16Z128m, 0},
- {X86::VFMADD132NEPBF16Z256r, X86::VFMADD132NEPBF16Z256m, 0},
- {X86::VFMADD132NEPBF16Zr, X86::VFMADD132NEPBF16Zm, 0},
+ {X86::VFMADD132BF16Z128r, X86::VFMADD132BF16Z128m, 0},
+ {X86::VFMADD132BF16Z256r, X86::VFMADD132BF16Z256m, 0},
+ {X86::VFMADD132BF16Zr, X86::VFMADD132BF16Zm, 0},
{X86::VFMADD132PDYr, X86::VFMADD132PDYm, 0},
{X86::VFMADD132PDZ128r, X86::VFMADD132PDZ128m, 0},
{X86::VFMADD132PDZ256r, X86::VFMADD132PDZ256m, 0},
@@ -4626,9 +4626,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMADD132SSZr_Int, X86::VFMADD132SSZm_Int, TB_NO_REVERSE},
{X86::VFMADD132SSr, X86::VFMADD132SSm, 0},
{X86::VFMADD132SSr_Int, X86::VFMADD132SSm_Int, TB_NO_REVERSE},
- {X86::VFMADD213NEPBF16Z128r, X86::VFMADD213NEPBF16Z128m, 0},
- {X86::VFMADD213NEPBF16Z256r, X86::VFMADD213NEPBF16Z256m, 0},
- {X86::VFMADD213NEPBF16Zr, X86::VFMADD213NEPBF16Zm, 0},
+ {X86::VFMADD213BF16Z128r, X86::VFMADD213BF16Z128m, 0},
+ {X86::VFMADD213BF16Z256r, X86::VFMADD213BF16Z256m, 0},
+ {X86::VFMADD213BF16Zr, X86::VFMADD213BF16Zm, 0},
{X86::VFMADD213PDYr, X86::VFMADD213PDYm, 0},
{X86::VFMADD213PDZ128r, X86::VFMADD213PDZ128m, 0},
{X86::VFMADD213PDZ256r, X86::VFMADD213PDZ256m, 0},
@@ -4652,9 +4652,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMADD213SSZr_Int, X86::VFMADD213SSZm_Int, TB_NO_REVERSE},
{X86::VFMADD213SSr, X86::VFMADD213SSm, 0},
{X86::VFMADD213SSr_Int, X86::VFMADD213SSm_Int, TB_NO_REVERSE},
- {X86::VFMADD231NEPBF16Z128r, X86::VFMADD231NEPBF16Z128m, 0},
- {X86::VFMADD231NEPBF16Z256r, X86::VFMADD231NEPBF16Z256m, 0},
- {X86::VFMADD231NEPBF16Zr, X86::VFMADD231NEPBF16Zm, 0},
+ {X86::VFMADD231BF16Z128r, X86::VFMADD231BF16Z128m, 0},
+ {X86::VFMADD231BF16Z256r, X86::VFMADD231BF16Z256m, 0},
+ {X86::VFMADD231BF16Zr, X86::VFMADD231BF16Zm, 0},
{X86::VFMADD231PDYr, X86::VFMADD231PDYm, 0},
{X86::VFMADD231PDZ128r, X86::VFMADD231PDZ128m, 0},
{X86::VFMADD231PDZ256r, X86::VFMADD231PDZ256m, 0},
@@ -4733,9 +4733,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMADDSUBPD4rr, X86::VFMADDSUBPD4rm, 0},
{X86::VFMADDSUBPS4Yrr, X86::VFMADDSUBPS4Yrm, 0},
{X86::VFMADDSUBPS4rr, X86::VFMADDSUBPS4rm, 0},
- {X86::VFMSUB132NEPBF16Z128r, X86::VFMSUB132NEPBF16Z128m, 0},
- {X86::VFMSUB132NEPBF16Z256r, X86::VFMSUB132NEPBF16Z256m, 0},
- {X86::VFMSUB132NEPBF16Zr, X86::VFMSUB132NEPBF16Zm, 0},
+ {X86::VFMSUB132BF16Z128r, X86::VFMSUB132BF16Z128m, 0},
+ {X86::VFMSUB132BF16Z256r, X86::VFMSUB132BF16Z256m, 0},
+ {X86::VFMSUB132BF16Zr, X86::VFMSUB132BF16Zm, 0},
{X86::VFMSUB132PDYr, X86::VFMSUB132PDYm, 0},
{X86::VFMSUB132PDZ128r, X86::VFMSUB132PDZ128m, 0},
{X86::VFMSUB132PDZ256r, X86::VFMSUB132PDZ256m, 0},
@@ -4759,9 +4759,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMSUB132SSZr_Int, X86::VFMSUB132SSZm_Int, TB_NO_REVERSE},
{X86::VFMSUB132SSr, X86::VFMSUB132SSm, 0},
{X86::VFMSUB132SSr_Int, X86::VFMSUB132SSm_Int, TB_NO_REVERSE},
- {X86::VFMSUB213NEPBF16Z128r, X86::VFMSUB213NEPBF16Z128m, 0},
- {X86::VFMSUB213NEPBF16Z256r, X86::VFMSUB213NEPBF16Z256m, 0},
- {X86::VFMSUB213NEPBF16Zr, X86::VFMSUB213NEPBF16Zm, 0},
+ {X86::VFMSUB213BF16Z128r, X86::VFMSUB213BF16Z128m, 0},
+ {X86::VFMSUB213BF16Z256r, X86::VFMSUB213BF16Z256m, 0},
+ {X86::VFMSUB213BF16Zr, X86::VFMSUB213BF16Zm, 0},
{X86::VFMSUB213PDYr, X86::VFMSUB213PDYm, 0},
{X86::VFMSUB213PDZ128r, X86::VFMSUB213PDZ128m, 0},
{X86::VFMSUB213PDZ256r, X86::VFMSUB213PDZ256m, 0},
@@ -4785,9 +4785,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMSUB213SSZr_Int, X86::VFMSUB213SSZm_Int, TB_NO_REVERSE},
{X86::VFMSUB213SSr, X86::VFMSUB213SSm, 0},
{X86::VFMSUB213SSr_Int, X86::VFMSUB213SSm_Int, TB_NO_REVERSE},
- {X86::VFMSUB231NEPBF16Z128r, X86::VFMSUB231NEPBF16Z128m, 0},
- {X86::VFMSUB231NEPBF16Z256r, X86::VFMSUB231NEPBF16Z256m, 0},
- {X86::VFMSUB231NEPBF16Zr, X86::VFMSUB231NEPBF16Zm, 0},
+ {X86::VFMSUB231BF16Z128r, X86::VFMSUB231BF16Z128m, 0},
+ {X86::VFMSUB231BF16Z256r, X86::VFMSUB231BF16Z256m, 0},
+ {X86::VFMSUB231BF16Zr, X86::VFMSUB231BF16Zm, 0},
{X86::VFMSUB231PDYr, X86::VFMSUB231PDYm, 0},
{X86::VFMSUB231PDZ128r, X86::VFMSUB231PDZ128m, 0},
{X86::VFMSUB231PDZ256r, X86::VFMSUB231PDZ256m, 0},
@@ -4866,9 +4866,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFMULCPHZ256rrkz, X86::VFMULCPHZ256rmkz, 0},
{X86::VFMULCPHZrrkz, X86::VFMULCPHZrmkz, 0},
{X86::VFMULCSHZrrkz, X86::VFMULCSHZrmkz, TB_NO_REVERSE},
- {X86::VFNMADD132NEPBF16Z128r, X86::VFNMADD132NEPBF16Z128m, 0},
- {X86::VFNMADD132NEPBF16Z256r, X86::VFNMADD132NEPBF16Z256m, 0},
- {X86::VFNMADD132NEPBF16Zr, X86::VFNMADD132NEPBF16Zm, 0},
+ {X86::VFNMADD132BF16Z128r, X86::VFNMADD132BF16Z128m, 0},
+ {X86::VFNMADD132BF16Z256r, X86::VFNMADD132BF16Z256m, 0},
+ {X86::VFNMADD132BF16Zr, X86::VFNMADD132BF16Zm, 0},
{X86::VFNMADD132PDYr, X86::VFNMADD132PDYm, 0},
{X86::VFNMADD132PDZ128r, X86::VFNMADD132PDZ128m, 0},
{X86::VFNMADD132PDZ256r, X86::VFNMADD132PDZ256m, 0},
@@ -4892,9 +4892,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMADD132SSZr_Int, X86::VFNMADD132SSZm_Int, TB_NO_REVERSE},
{X86::VFNMADD132SSr, X86::VFNMADD132SSm, 0},
{X86::VFNMADD132SSr_Int, X86::VFNMADD132SSm_Int, TB_NO_REVERSE},
- {X86::VFNMADD213NEPBF16Z128r, X86::VFNMADD213NEPBF16Z128m, 0},
- {X86::VFNMADD213NEPBF16Z256r, X86::VFNMADD213NEPBF16Z256m, 0},
- {X86::VFNMADD213NEPBF16Zr, X86::VFNMADD213NEPBF16Zm, 0},
+ {X86::VFNMADD213BF16Z128r, X86::VFNMADD213BF16Z128m, 0},
+ {X86::VFNMADD213BF16Z256r, X86::VFNMADD213BF16Z256m, 0},
+ {X86::VFNMADD213BF16Zr, X86::VFNMADD213BF16Zm, 0},
{X86::VFNMADD213PDYr, X86::VFNMADD213PDYm, 0},
{X86::VFNMADD213PDZ128r, X86::VFNMADD213PDZ128m, 0},
{X86::VFNMADD213PDZ256r, X86::VFNMADD213PDZ256m, 0},
@@ -4918,9 +4918,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMADD213SSZr_Int, X86::VFNMADD213SSZm_Int, TB_NO_REVERSE},
{X86::VFNMADD213SSr, X86::VFNMADD213SSm, 0},
{X86::VFNMADD213SSr_Int, X86::VFNMADD213SSm_Int, TB_NO_REVERSE},
- {X86::VFNMADD231NEPBF16Z128r, X86::VFNMADD231NEPBF16Z128m, 0},
- {X86::VFNMADD231NEPBF16Z256r, X86::VFNMADD231NEPBF16Z256m, 0},
- {X86::VFNMADD231NEPBF16Zr, X86::VFNMADD231NEPBF16Zm, 0},
+ {X86::VFNMADD231BF16Z128r, X86::VFNMADD231BF16Z128m, 0},
+ {X86::VFNMADD231BF16Z256r, X86::VFNMADD231BF16Z256m, 0},
+ {X86::VFNMADD231BF16Zr, X86::VFNMADD231BF16Zm, 0},
{X86::VFNMADD231PDYr, X86::VFNMADD231PDYm, 0},
{X86::VFNMADD231PDZ128r, X86::VFNMADD231PDZ128m, 0},
{X86::VFNMADD231PDZ256r, X86::VFNMADD231PDZ256m, 0},
@@ -4952,9 +4952,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMADDSD4rr_Int, X86::VFNMADDSD4rm_Int, TB_NO_REVERSE},
{X86::VFNMADDSS4rr, X86::VFNMADDSS4rm, 0},
{X86::VFNMADDSS4rr_Int, X86::VFNMADDSS4rm_Int, TB_NO_REVERSE},
- {X86::VFNMSUB132NEPBF16Z128r, X86::VFNMSUB132NEPBF16Z128m, 0},
- {X86::VFNMSUB132NEPBF16Z256r, X86::VFNMSUB132NEPBF16Z256m, 0},
- {X86::VFNMSUB132NEPBF16Zr, X86::VFNMSUB132NEPBF16Zm, 0},
+ {X86::VFNMSUB132BF16Z128r, X86::VFNMSUB132BF16Z128m, 0},
+ {X86::VFNMSUB132BF16Z256r, X86::VFNMSUB132BF16Z256m, 0},
+ {X86::VFNMSUB132BF16Zr, X86::VFNMSUB132BF16Zm, 0},
{X86::VFNMSUB132PDYr, X86::VFNMSUB132PDYm, 0},
{X86::VFNMSUB132PDZ128r, X86::VFNMSUB132PDZ128m, 0},
{X86::VFNMSUB132PDZ256r, X86::VFNMSUB132PDZ256m, 0},
@@ -4978,9 +4978,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMSUB132SSZr_Int, X86::VFNMSUB132SSZm_Int, TB_NO_REVERSE},
{X86::VFNMSUB132SSr, X86::VFNMSUB132SSm, 0},
{X86::VFNMSUB132SSr_Int, X86::VFNMSUB132SSm_Int, TB_NO_REVERSE},
- {X86::VFNMSUB213NEPBF16Z128r, X86::VFNMSUB213NEPBF16Z128m, 0},
- {X86::VFNMSUB213NEPBF16Z256r, X86::VFNMSUB213NEPBF16Z256m, 0},
- {X86::VFNMSUB213NEPBF16Zr, X86::VFNMSUB213NEPBF16Zm, 0},
+ {X86::VFNMSUB213BF16Z128r, X86::VFNMSUB213BF16Z128m, 0},
+ {X86::VFNMSUB213BF16Z256r, X86::VFNMSUB213BF16Z256m, 0},
+ {X86::VFNMSUB213BF16Zr, X86::VFNMSUB213BF16Zm, 0},
{X86::VFNMSUB213PDYr, X86::VFNMSUB213PDYm, 0},
{X86::VFNMSUB213PDZ128r, X86::VFNMSUB213PDZ128m, 0},
{X86::VFNMSUB213PDZ256r, X86::VFNMSUB213PDZ256m, 0},
@@ -5004,9 +5004,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMSUB213SSZr_Int, X86::VFNMSUB213SSZm_Int, TB_NO_REVERSE},
{X86::VFNMSUB213SSr, X86::VFNMSUB213SSm, 0},
{X86::VFNMSUB213SSr_Int, X86::VFNMSUB213SSm_Int, TB_NO_REVERSE},
- {X86::VFNMSUB231NEPBF16Z128r, X86::VFNMSUB231NEPBF16Z128m, 0},
- {X86::VFNMSUB231NEPBF16Z256r, X86::VFNMSUB231NEPBF16Z256m, 0},
- {X86::VFNMSUB231NEPBF16Zr, X86::VFNMSUB231NEPBF16Zm, 0},
+ {X86::VFNMSUB231BF16Z128r, X86::VFNMSUB231BF16Z128m, 0},
+ {X86::VFNMSUB231BF16Z256r, X86::VFNMSUB231BF16Z256m, 0},
+ {X86::VFNMSUB231BF16Zr, X86::VFNMSUB231BF16Zm, 0},
{X86::VFNMSUB231PDYr, X86::VFNMSUB231PDYm, 0},
{X86::VFNMSUB231PDZ128r, X86::VFNMSUB231PDZ128m, 0},
{X86::VFNMSUB231PDZ256r, X86::VFNMSUB231PDZ256m, 0},
@@ -5038,9 +5038,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VFNMSUBSD4rr_Int, X86::VFNMSUBSD4rm_Int, TB_NO_REVERSE},
{X86::VFNMSUBSS4rr, X86::VFNMSUBSS4rm, 0},
{X86::VFNMSUBSS4rr_Int, X86::VFNMSUBSS4rm_Int, TB_NO_REVERSE},
- {X86::VGETEXPPBF16Z128rk, X86::VGETEXPPBF16Z128mk, 0},
- {X86::VGETEXPPBF16Z256rk, X86::VGETEXPPBF16Z256mk, 0},
- {X86::VGETEXPPBF16Zrk, X86::VGETEXPPBF16Zmk, 0},
+ {X86::VGETEXPBF16Z128rk, X86::VGETEXPBF16Z128mk, 0},
+ {X86::VGETEXPBF16Z256rk, X86::VGETEXPBF16Z256mk, 0},
+ {X86::VGETEXPBF16Zrk, X86::VGETEXPBF16Zmk, 0},
{X86::VGETEXPPDZ128rk, X86::VGETEXPPDZ128mk, 0},
{X86::VGETEXPPDZ256rk, X86::VGETEXPPDZ256mk, 0},
{X86::VGETEXPPDZrk, X86::VGETEXPPDZmk, 0},
@@ -5053,9 +5053,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VGETEXPSDZrkz, X86::VGETEXPSDZmkz, TB_NO_REVERSE},
{X86::VGETEXPSHZrkz, X86::VGETEXPSHZmkz, TB_NO_REVERSE},
{X86::VGETEXPSSZrkz, X86::VGETEXPSSZmkz, TB_NO_REVERSE},
- {X86::VGETMANTPBF16Z128rrik, X86::VGETMANTPBF16Z128rmik, 0},
- {X86::VGETMANTPBF16Z256rrik, X86::VGETMANTPBF16Z256rmik, 0},
- {X86::VGETMANTPBF16Zrrik, X86::VGETMANTPBF16Zrmik, 0},
+ {X86::VGETMANTBF16Z128rrik, X86::VGETMANTBF16Z128rmik, 0},
+ {X86::VGETMANTBF16Z256rrik, X86::VGETMANTBF16Z256rmik, 0},
+ {X86::VGETMANTBF16Zrrik, X86::VGETMANTBF16Zrmik, 0},
{X86::VGETMANTPDZ128rrik, X86::VGETMANTPDZ128rmik, 0},
{X86::VGETMANTPDZ256rrik, X86::VGETMANTPDZ256rmik, 0},
{X86::VGETMANTPDZrrik, X86::VGETMANTPDZrmik, 0},
@@ -5089,6 +5089,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VINSERTI64X2Z256rrikz, X86::VINSERTI64X2Z256rmikz, 0},
{X86::VINSERTI64X2Zrrikz, X86::VINSERTI64X2Zrmikz, 0},
{X86::VINSERTI64X4Zrrikz, X86::VINSERTI64X4Zrmikz, 0},
+ {X86::VMAXBF16Z128rrkz, X86::VMAXBF16Z128rmkz, 0},
+ {X86::VMAXBF16Z256rrkz, X86::VMAXBF16Z256rmkz, 0},
+ {X86::VMAXBF16Zrrkz, X86::VMAXBF16Zrmkz, 0},
{X86::VMAXCPDZ128rrkz, X86::VMAXCPDZ128rmkz, 0},
{X86::VMAXCPDZ256rrkz, X86::VMAXCPDZ256rmkz, 0},
{X86::VMAXCPDZrrkz, X86::VMAXCPDZrmkz, 0},
@@ -5098,9 +5101,6 @@ static const X86FoldTableEntry Table3[] = {
{X86::VMAXCPSZ128rrkz, X86::VMAXCPSZ128rmkz, 0},
{X86::VMAXCPSZ256rrkz, X86::VMAXCPSZ256rmkz, 0},
{X86::VMAXCPSZrrkz, X86::VMAXCPSZrmkz, 0},
- {X86::VMAXPBF16Z128rrkz, X86::VMAXPBF16Z128rmkz, 0},
- {X86::VMAXPBF16Z256rrkz, X86::VMAXPBF16Z256rmkz, 0},
- {X86::VMAXPBF16Zrrkz, X86::VMAXPBF16Zrmkz, 0},
{X86::VMAXPDZ128rrkz, X86::VMAXPDZ128rmkz, 0},
{X86::VMAXPDZ256rrkz, X86::VMAXPDZ256rmkz, 0},
{X86::VMAXPDZrrkz, X86::VMAXPDZrmkz, 0},
@@ -5113,6 +5113,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VMAXSDZrrkz_Int, X86::VMAXSDZrmkz_Int, TB_NO_REVERSE},
{X86::VMAXSHZrrkz_Int, X86::VMAXSHZrmkz_Int, TB_NO_REVERSE},
{X86::VMAXSSZrrkz_Int, X86::VMAXSSZrmkz_Int, TB_NO_REVERSE},
+ {X86::VMINBF16Z128rrkz, X86::VMINBF16Z128rmkz, 0},
+ {X86::VMINBF16Z256rrkz, X86::VMINBF16Z256rmkz, 0},
+ {X86::VMINBF16Zrrkz, X86::VMINBF16Zrmkz, 0},
{X86::VMINCPDZ128rrkz, X86::VMINCPDZ128rmkz, 0},
{X86::VMINCPDZ256rrkz, X86::VMINCPDZ256rmkz, 0},
{X86::VMINCPDZrrkz, X86::VMINCPDZrmkz, 0},
@@ -5137,9 +5140,6 @@ static const X86FoldTableEntry Table3[] = {
{X86::VMINMAXSDrrikz_Int, X86::VMINMAXSDrmikz_Int, TB_NO_REVERSE},
{X86::VMINMAXSHrrikz_Int, X86::VMINMAXSHrmikz_Int, TB_NO_REVERSE},
{X86::VMINMAXSSrrikz_Int, X86::VMINMAXSSrmikz_Int, TB_NO_REVERSE},
- {X86::VMINPBF16Z128rrkz, X86::VMINPBF16Z128rmkz, 0},
- {X86::VMINPBF16Z256rrkz, X86::VMINPBF16Z256rmkz, 0},
- {X86::VMINPBF16Zrrkz, X86::VMINPBF16Zrmkz, 0},
{X86::VMINPDZ128rrkz, X86::VMINPDZ128rmkz, 0},
{X86::VMINPDZ256rrkz, X86::VMINPDZ256rmkz, 0},
{X86::VMINPDZrrkz, X86::VMINPDZrmkz, 0},
@@ -5194,9 +5194,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VMPSADBWZ128rrikz, X86::VMPSADBWZ128rmikz, 0},
{X86::VMPSADBWZ256rrikz, X86::VMPSADBWZ256rmikz, 0},
{X86::VMPSADBWZrrikz, X86::VMPSADBWZrmikz, 0},
- {X86::VMULNEPBF16Z128rrkz, X86::VMULNEPBF16Z128rmkz, 0},
- {X86::VMULNEPBF16Z256rrkz, X86::VMULNEPBF16Z256rmkz, 0},
- {X86::VMULNEPBF16Zrrkz, X86::VMULNEPBF16Zrmkz, 0},
+ {X86::VMULBF16Z128rrkz, X86::VMULBF16Z128rmkz, 0},
+ {X86::VMULBF16Z256rrkz, X86::VMULBF16Z256rmkz, 0},
+ {X86::VMULBF16Zrrkz, X86::VMULBF16Zrmkz, 0},
{X86::VMULPDZ128rrkz, X86::VMULPDZ128rmkz, 0},
{X86::VMULPDZ256rrkz, X86::VMULPDZ256rmkz, 0},
{X86::VMULPDZrrkz, X86::VMULPDZrmkz, 0},
@@ -5938,16 +5938,16 @@ static const X86FoldTableEntry Table3[] = {
{X86::VRCP28PSZrk, X86::VRCP28PSZmk, 0},
{X86::VRCP28SDZrkz, X86::VRCP28SDZmkz, TB_NO_REVERSE},
{X86::VRCP28SSZrkz, X86::VRCP28SSZmkz, TB_NO_REVERSE},
- {X86::VRCPPBF16Z128rk, X86::VRCPPBF16Z128mk, 0},
- {X86::VRCPPBF16Z256rk, X86::VRCPPBF16Z256mk, 0},
- {X86::VRCPPBF16Zrk, X86::VRCPPBF16Zmk, 0},
+ {X86::VRCPBF16Z128rk, X86::VRCPBF16Z128mk, 0},
+ {X86::VRCPBF16Z256rk, X86::VRCPBF16Z256mk, 0},
+ {X86::VRCPBF16Zrk, X86::VRCPBF16Zmk, 0},
{X86::VRCPPHZ128rk, X86::VRCPPHZ128mk, 0},
{X86::VRCPPHZ256rk, X86::VRCPPHZ256mk, 0},
{X86::VRCPPHZrk, X86::VRCPPHZmk, 0},
{X86::VRCPSHZrrkz, X86::VRCPSHZrmkz, TB_NO_REVERSE},
- {X86::VREDUCENEPBF16Z128rrik, X86::VREDUCENEPBF16Z128rmik, 0},
- {X86::VREDUCENEPBF16Z256rrik, X86::VREDUCENEPBF16Z256rmik, 0},
- {X86::VREDUCENEPBF16Zrrik, X86::VREDUCENEPBF16Zrmik, 0},
+ {X86::VREDUCEBF16Z128rrik, X86::VREDUCEBF16Z128rmik, 0},
+ {X86::VREDUCEBF16Z256rrik, X86::VREDUCEBF16Z256rmik, 0},
+ {X86::VREDUCEBF16Zrrik, X86::VREDUCEBF16Zrmik, 0},
{X86::VREDUCEPDZ128rrik, X86::VREDUCEPDZ128rmik, 0},
{X86::VREDUCEPDZ256rrik, X86::VREDUCEPDZ256rmik, 0},
{X86::VREDUCEPDZrrik, X86::VREDUCEPDZrmik, 0},
@@ -5960,9 +5960,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VREDUCESDZrrikz, X86::VREDUCESDZrmikz, TB_NO_REVERSE},
{X86::VREDUCESHZrrikz, X86::VREDUCESHZrmikz, TB_NO_REVERSE},
{X86::VREDUCESSZrrikz, X86::VREDUCESSZrmikz, TB_NO_REVERSE},
- {X86::VRNDSCALENEPBF16Z128rrik, X86::VRNDSCALENEPBF16Z128rmik, 0},
- {X86::VRNDSCALENEPBF16Z256rrik, X86::VRNDSCALENEPBF16Z256rmik, 0},
- {X86::VRNDSCALENEPBF16Zrrik, X86::VRNDSCALENEPBF16Zrmik, 0},
+ {X86::VRNDSCALEBF16Z128rrik, X86::VRNDSCALEBF16Z128rmik, 0},
+ {X86::VRNDSCALEBF16Z256rrik, X86::VRNDSCALEBF16Z256rmik, 0},
+ {X86::VRNDSCALEBF16Zrrik, X86::VRNDSCALEBF16Zrmik, 0},
{X86::VRNDSCALEPDZ128rrik, X86::VRNDSCALEPDZ128rmik, 0},
{X86::VRNDSCALEPDZ256rrik, X86::VRNDSCALEPDZ256rmik, 0},
{X86::VRNDSCALEPDZrrik, X86::VRNDSCALEPDZrmik, 0},
@@ -5987,16 +5987,16 @@ static const X86FoldTableEntry Table3[] = {
{X86::VRSQRT28PSZrk, X86::VRSQRT28PSZmk, 0},
{X86::VRSQRT28SDZrkz, X86::VRSQRT28SDZmkz, TB_NO_REVERSE},
{X86::VRSQRT28SSZrkz, X86::VRSQRT28SSZmkz, TB_NO_REVERSE},
- {X86::VRSQRTPBF16Z128rk, X86::VRSQRTPBF16Z128mk, 0},
- {X86::VRSQRTPBF16Z256rk, X86::VRSQRTPBF16Z256mk, 0},
- {X86::VRSQRTPBF16Zrk, X86::VRSQRTPBF16Zmk, 0},
+ {X86::VRSQRTBF16Z128rk, X86::VRSQRTBF16Z128mk, 0},
+ {X86::VRSQRTBF16Z256rk, X86::VRSQRTBF16Z256mk, 0},
+ {X86::VRSQRTBF16Zrk, X86::VRSQRTBF16Zmk, 0},
{X86::VRSQRTPHZ128rk, X86::VRSQRTPHZ128mk, 0},
{X86::VRSQRTPHZ256rk, X86::VRSQRTPHZ256mk, 0},
{X86::VRSQRTPHZrk, X86::VRSQRTPHZmk, 0},
{X86::VRSQRTSHZrrkz, X86::VRSQRTSHZrmkz, TB_NO_REVERSE},
- {X86::VSCALEFPBF16Z128rrkz, X86::VSCALEFPBF16Z128rmkz, 0},
- {X86::VSCALEFPBF16Z256rrkz, X86::VSCALEFPBF16Z256rmkz, 0},
- {X86::VSCALEFPBF16Zrrkz, X86::VSCALEFPBF16Zrmkz, 0},
+ {X86::VSCALEFBF16Z128rrkz, X86::VSCALEFBF16Z128rmkz, 0},
+ {X86::VSCALEFBF16Z256rrkz, X86::VSCALEFBF16Z256rmkz, 0},
+ {X86::VSCALEFBF16Zrrkz, X86::VSCALEFBF16Zrmkz, 0},
{X86::VSCALEFPDZ128rrkz, X86::VSCALEFPDZ128rmkz, 0},
{X86::VSCALEFPDZ256rrkz, X86::VSCALEFPDZ256rmkz, 0},
{X86::VSCALEFPDZrrkz, X86::VSCALEFPDZrmkz, 0},
@@ -6026,9 +6026,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VSM3MSG1rr, X86::VSM3MSG1rm, 0},
{X86::VSM3MSG2rr, X86::VSM3MSG2rm, 0},
{X86::VSM3RNDS2rr, X86::VSM3RNDS2rm, 0},
- {X86::VSQRTNEPBF16Z128rk, X86::VSQRTNEPBF16Z128mk, 0},
- {X86::VSQRTNEPBF16Z256rk, X86::VSQRTNEPBF16Z256mk, 0},
- {X86::VSQRTNEPBF16Zrk, X86::VSQRTNEPBF16Zmk, 0},
+ {X86::VSQRTBF16Z128rk, X86::VSQRTBF16Z128mk, 0},
+ {X86::VSQRTBF16Z256rk, X86::VSQRTBF16Z256mk, 0},
+ {X86::VSQRTBF16Zrk, X86::VSQRTBF16Zmk, 0},
{X86::VSQRTPDZ128rk, X86::VSQRTPDZ128mk, 0},
{X86::VSQRTPDZ256rk, X86::VSQRTPDZ256mk, 0},
{X86::VSQRTPDZrk, X86::VSQRTPDZmk, 0},
@@ -6041,9 +6041,9 @@ static const X86FoldTableEntry Table3[] = {
{X86::VSQRTSDZrkz_Int, X86::VSQRTSDZmkz_Int, TB_NO_REVERSE},
{X86::VSQRTSHZrkz_Int, X86::VSQRTSHZmkz_Int, TB_NO_REVERSE},
{X86::VSQRTSSZrkz_Int, X86::VSQRTSSZmkz_Int, TB_NO_REVERSE},
- {X86::VSUBNEPBF16Z128rrkz, X86::VSUBNEPBF16Z128rmkz, 0},
- {X86::VSUBNEPBF16Z256rrkz, X86::VSUBNEPBF16Z256rmkz, 0},
- {X86::VSUBNEPBF16Zrrkz, X86::VSUBNEPBF16Zrmkz, 0},
+ {X86::VSUBBF16Z128rrkz, X86::VSUBBF16Z128rmkz, 0},
+ {X86::VSUBBF16Z256rrkz, X86::VSUBBF16Z256rmkz, 0},
+ {X86::VSUBBF16Zrrkz, X86::VSUBBF16Zrmkz, 0},
{X86::VSUBPDZ128rrkz, X86::VSUBPDZ128rmkz, 0},
{X86::VSUBPDZ256rrkz, X86::VSUBPDZ256rmkz, 0},
{X86::VSUBPDZrrkz, X86::VSUBPDZrmkz, 0},
@@ -6077,9 +6077,9 @@ static const X86FoldTableEntry Table3[] = {
};
static const X86FoldTableEntry Table4[] = {
- {X86::VADDNEPBF16Z128rrk, X86::VADDNEPBF16Z128rmk, 0},
- {X86::VADDNEPBF16Z256rrk, X86::VADDNEPBF16Z256rmk, 0},
- {X86::VADDNEPBF16Zrrk, X86::VADDNEPBF16Zrmk, 0},
+ {X86::VADDBF16Z128rrk, X86::VADDBF16Z128rmk, 0},
+ {X86::VADDBF16Z256rrk, X86::VADDBF16Z256rmk, 0},
+ {X86::VADDBF16Zrrk, X86::VADDBF16Zrmk, 0},
{X86::VADDPDZ128rrk, X86::VADDPDZ128rmk, 0},
{X86::VADDPDZ256rrk, X86::VADDPDZ256rmk, 0},
{X86::VADDPDZrrk, X86::VADDPDZrmk, 0},
@@ -6149,9 +6149,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VDBPSADBWZ128rrik, X86::VDBPSADBWZ128rmik, 0},
{X86::VDBPSADBWZ256rrik, X86::VDBPSADBWZ256rmik, 0},
{X86::VDBPSADBWZrrik, X86::VDBPSADBWZrmik, 0},
- {X86::VDIVNEPBF16Z128rrk, X86::VDIVNEPBF16Z128rmk, 0},
- {X86::VDIVNEPBF16Z256rrk, X86::VDIVNEPBF16Z256rmk, 0},
- {X86::VDIVNEPBF16Zrrk, X86::VDIVNEPBF16Zrmk, 0},
+ {X86::VDIVBF16Z128rrk, X86::VDIVBF16Z128rmk, 0},
+ {X86::VDIVBF16Z256rrk, X86::VDIVBF16Z256rmk, 0},
+ {X86::VDIVBF16Zrrk, X86::VDIVBF16Zrmk, 0},
{X86::VDIVPDZ128rrk, X86::VDIVPDZ128rmk, 0},
{X86::VDIVPDZ256rrk, X86::VDIVPDZ256rmk, 0},
{X86::VDIVPDZrrk, X86::VDIVPDZrmk, 0},
@@ -6204,12 +6204,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFIXUPIMMSDZrrikz, X86::VFIXUPIMMSDZrmikz, TB_NO_REVERSE},
{X86::VFIXUPIMMSSZrrik, X86::VFIXUPIMMSSZrmik, TB_NO_REVERSE},
{X86::VFIXUPIMMSSZrrikz, X86::VFIXUPIMMSSZrmikz, TB_NO_REVERSE},
- {X86::VFMADD132NEPBF16Z128rk, X86::VFMADD132NEPBF16Z128mk, 0},
- {X86::VFMADD132NEPBF16Z128rkz, X86::VFMADD132NEPBF16Z128mkz, 0},
- {X86::VFMADD132NEPBF16Z256rk, X86::VFMADD132NEPBF16Z256mk, 0},
- {X86::VFMADD132NEPBF16Z256rkz, X86::VFMADD132NEPBF16Z256mkz, 0},
- {X86::VFMADD132NEPBF16Zrk, X86::VFMADD132NEPBF16Zmk, 0},
- {X86::VFMADD132NEPBF16Zrkz, X86::VFMADD132NEPBF16Zmkz, 0},
+ {X86::VFMADD132BF16Z128rk, X86::VFMADD132BF16Z128mk, 0},
+ {X86::VFMADD132BF16Z128rkz, X86::VFMADD132BF16Z128mkz, 0},
+ {X86::VFMADD132BF16Z256rk, X86::VFMADD132BF16Z256mk, 0},
+ {X86::VFMADD132BF16Z256rkz, X86::VFMADD132BF16Z256mkz, 0},
+ {X86::VFMADD132BF16Zrk, X86::VFMADD132BF16Zmk, 0},
+ {X86::VFMADD132BF16Zrkz, X86::VFMADD132BF16Zmkz, 0},
{X86::VFMADD132PDZ128rk, X86::VFMADD132PDZ128mk, 0},
{X86::VFMADD132PDZ128rkz, X86::VFMADD132PDZ128mkz, 0},
{X86::VFMADD132PDZ256rk, X86::VFMADD132PDZ256mk, 0},
@@ -6234,12 +6234,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMADD132SHZrkz_Int, X86::VFMADD132SHZmkz_Int, TB_NO_REVERSE},
{X86::VFMADD132SSZrk_Int, X86::VFMADD132SSZmk_Int, TB_NO_REVERSE},
{X86::VFMADD132SSZrkz_Int, X86::VFMADD132SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFMADD213NEPBF16Z128rk, X86::VFMADD213NEPBF16Z128mk, 0},
- {X86::VFMADD213NEPBF16Z128rkz, X86::VFMADD213NEPBF16Z128mkz, 0},
- {X86::VFMADD213NEPBF16Z256rk, X86::VFMADD213NEPBF16Z256mk, 0},
- {X86::VFMADD213NEPBF16Z256rkz, X86::VFMADD213NEPBF16Z256mkz, 0},
- {X86::VFMADD213NEPBF16Zrk, X86::VFMADD213NEPBF16Zmk, 0},
- {X86::VFMADD213NEPBF16Zrkz, X86::VFMADD213NEPBF16Zmkz, 0},
+ {X86::VFMADD213BF16Z128rk, X86::VFMADD213BF16Z128mk, 0},
+ {X86::VFMADD213BF16Z128rkz, X86::VFMADD213BF16Z128mkz, 0},
+ {X86::VFMADD213BF16Z256rk, X86::VFMADD213BF16Z256mk, 0},
+ {X86::VFMADD213BF16Z256rkz, X86::VFMADD213BF16Z256mkz, 0},
+ {X86::VFMADD213BF16Zrk, X86::VFMADD213BF16Zmk, 0},
+ {X86::VFMADD213BF16Zrkz, X86::VFMADD213BF16Zmkz, 0},
{X86::VFMADD213PDZ128rk, X86::VFMADD213PDZ128mk, 0},
{X86::VFMADD213PDZ128rkz, X86::VFMADD213PDZ128mkz, 0},
{X86::VFMADD213PDZ256rk, X86::VFMADD213PDZ256mk, 0},
@@ -6264,12 +6264,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMADD213SHZrkz_Int, X86::VFMADD213SHZmkz_Int, TB_NO_REVERSE},
{X86::VFMADD213SSZrk_Int, X86::VFMADD213SSZmk_Int, TB_NO_REVERSE},
{X86::VFMADD213SSZrkz_Int, X86::VFMADD213SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFMADD231NEPBF16Z128rk, X86::VFMADD231NEPBF16Z128mk, 0},
- {X86::VFMADD231NEPBF16Z128rkz, X86::VFMADD231NEPBF16Z128mkz, 0},
- {X86::VFMADD231NEPBF16Z256rk, X86::VFMADD231NEPBF16Z256mk, 0},
- {X86::VFMADD231NEPBF16Z256rkz, X86::VFMADD231NEPBF16Z256mkz, 0},
- {X86::VFMADD231NEPBF16Zrk, X86::VFMADD231NEPBF16Zmk, 0},
- {X86::VFMADD231NEPBF16Zrkz, X86::VFMADD231NEPBF16Zmkz, 0},
+ {X86::VFMADD231BF16Z128rk, X86::VFMADD231BF16Z128mk, 0},
+ {X86::VFMADD231BF16Z128rkz, X86::VFMADD231BF16Z128mkz, 0},
+ {X86::VFMADD231BF16Z256rk, X86::VFMADD231BF16Z256mk, 0},
+ {X86::VFMADD231BF16Z256rkz, X86::VFMADD231BF16Z256mkz, 0},
+ {X86::VFMADD231BF16Zrk, X86::VFMADD231BF16Zmk, 0},
+ {X86::VFMADD231BF16Zrkz, X86::VFMADD231BF16Zmkz, 0},
{X86::VFMADD231PDZ128rk, X86::VFMADD231PDZ128mk, 0},
{X86::VFMADD231PDZ128rkz, X86::VFMADD231PDZ128mkz, 0},
{X86::VFMADD231PDZ256rk, X86::VFMADD231PDZ256mk, 0},
@@ -6356,12 +6356,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMADDSUB231PSZ256rkz, X86::VFMADDSUB231PSZ256mkz, 0},
{X86::VFMADDSUB231PSZrk, X86::VFMADDSUB231PSZmk, 0},
{X86::VFMADDSUB231PSZrkz, X86::VFMADDSUB231PSZmkz, 0},
- {X86::VFMSUB132NEPBF16Z128rk, X86::VFMSUB132NEPBF16Z128mk, 0},
- {X86::VFMSUB132NEPBF16Z128rkz, X86::VFMSUB132NEPBF16Z128mkz, 0},
- {X86::VFMSUB132NEPBF16Z256rk, X86::VFMSUB132NEPBF16Z256mk, 0},
- {X86::VFMSUB132NEPBF16Z256rkz, X86::VFMSUB132NEPBF16Z256mkz, 0},
- {X86::VFMSUB132NEPBF16Zrk, X86::VFMSUB132NEPBF16Zmk, 0},
- {X86::VFMSUB132NEPBF16Zrkz, X86::VFMSUB132NEPBF16Zmkz, 0},
+ {X86::VFMSUB132BF16Z128rk, X86::VFMSUB132BF16Z128mk, 0},
+ {X86::VFMSUB132BF16Z128rkz, X86::VFMSUB132BF16Z128mkz, 0},
+ {X86::VFMSUB132BF16Z256rk, X86::VFMSUB132BF16Z256mk, 0},
+ {X86::VFMSUB132BF16Z256rkz, X86::VFMSUB132BF16Z256mkz, 0},
+ {X86::VFMSUB132BF16Zrk, X86::VFMSUB132BF16Zmk, 0},
+ {X86::VFMSUB132BF16Zrkz, X86::VFMSUB132BF16Zmkz, 0},
{X86::VFMSUB132PDZ128rk, X86::VFMSUB132PDZ128mk, 0},
{X86::VFMSUB132PDZ128rkz, X86::VFMSUB132PDZ128mkz, 0},
{X86::VFMSUB132PDZ256rk, X86::VFMSUB132PDZ256mk, 0},
@@ -6386,12 +6386,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMSUB132SHZrkz_Int, X86::VFMSUB132SHZmkz_Int, TB_NO_REVERSE},
{X86::VFMSUB132SSZrk_Int, X86::VFMSUB132SSZmk_Int, TB_NO_REVERSE},
{X86::VFMSUB132SSZrkz_Int, X86::VFMSUB132SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFMSUB213NEPBF16Z128rk, X86::VFMSUB213NEPBF16Z128mk, 0},
- {X86::VFMSUB213NEPBF16Z128rkz, X86::VFMSUB213NEPBF16Z128mkz, 0},
- {X86::VFMSUB213NEPBF16Z256rk, X86::VFMSUB213NEPBF16Z256mk, 0},
- {X86::VFMSUB213NEPBF16Z256rkz, X86::VFMSUB213NEPBF16Z256mkz, 0},
- {X86::VFMSUB213NEPBF16Zrk, X86::VFMSUB213NEPBF16Zmk, 0},
- {X86::VFMSUB213NEPBF16Zrkz, X86::VFMSUB213NEPBF16Zmkz, 0},
+ {X86::VFMSUB213BF16Z128rk, X86::VFMSUB213BF16Z128mk, 0},
+ {X86::VFMSUB213BF16Z128rkz, X86::VFMSUB213BF16Z128mkz, 0},
+ {X86::VFMSUB213BF16Z256rk, X86::VFMSUB213BF16Z256mk, 0},
+ {X86::VFMSUB213BF16Z256rkz, X86::VFMSUB213BF16Z256mkz, 0},
+ {X86::VFMSUB213BF16Zrk, X86::VFMSUB213BF16Zmk, 0},
+ {X86::VFMSUB213BF16Zrkz, X86::VFMSUB213BF16Zmkz, 0},
{X86::VFMSUB213PDZ128rk, X86::VFMSUB213PDZ128mk, 0},
{X86::VFMSUB213PDZ128rkz, X86::VFMSUB213PDZ128mkz, 0},
{X86::VFMSUB213PDZ256rk, X86::VFMSUB213PDZ256mk, 0},
@@ -6416,12 +6416,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMSUB213SHZrkz_Int, X86::VFMSUB213SHZmkz_Int, TB_NO_REVERSE},
{X86::VFMSUB213SSZrk_Int, X86::VFMSUB213SSZmk_Int, TB_NO_REVERSE},
{X86::VFMSUB213SSZrkz_Int, X86::VFMSUB213SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFMSUB231NEPBF16Z128rk, X86::VFMSUB231NEPBF16Z128mk, 0},
- {X86::VFMSUB231NEPBF16Z128rkz, X86::VFMSUB231NEPBF16Z128mkz, 0},
- {X86::VFMSUB231NEPBF16Z256rk, X86::VFMSUB231NEPBF16Z256mk, 0},
- {X86::VFMSUB231NEPBF16Z256rkz, X86::VFMSUB231NEPBF16Z256mkz, 0},
- {X86::VFMSUB231NEPBF16Zrk, X86::VFMSUB231NEPBF16Zmk, 0},
- {X86::VFMSUB231NEPBF16Zrkz, X86::VFMSUB231NEPBF16Zmkz, 0},
+ {X86::VFMSUB231BF16Z128rk, X86::VFMSUB231BF16Z128mk, 0},
+ {X86::VFMSUB231BF16Z128rkz, X86::VFMSUB231BF16Z128mkz, 0},
+ {X86::VFMSUB231BF16Z256rk, X86::VFMSUB231BF16Z256mk, 0},
+ {X86::VFMSUB231BF16Z256rkz, X86::VFMSUB231BF16Z256mkz, 0},
+ {X86::VFMSUB231BF16Zrk, X86::VFMSUB231BF16Zmk, 0},
+ {X86::VFMSUB231BF16Zrkz, X86::VFMSUB231BF16Zmkz, 0},
{X86::VFMSUB231PDZ128rk, X86::VFMSUB231PDZ128mk, 0},
{X86::VFMSUB231PDZ128rkz, X86::VFMSUB231PDZ128mkz, 0},
{X86::VFMSUB231PDZ256rk, X86::VFMSUB231PDZ256mk, 0},
@@ -6504,12 +6504,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFMULCPHZ256rrk, X86::VFMULCPHZ256rmk, 0},
{X86::VFMULCPHZrrk, X86::VFMULCPHZrmk, 0},
{X86::VFMULCSHZrrk, X86::VFMULCSHZrmk, TB_NO_REVERSE},
- {X86::VFNMADD132NEPBF16Z128rk, X86::VFNMADD132NEPBF16Z128mk, 0},
- {X86::VFNMADD132NEPBF16Z128rkz, X86::VFNMADD132NEPBF16Z128mkz, 0},
- {X86::VFNMADD132NEPBF16Z256rk, X86::VFNMADD132NEPBF16Z256mk, 0},
- {X86::VFNMADD132NEPBF16Z256rkz, X86::VFNMADD132NEPBF16Z256mkz, 0},
- {X86::VFNMADD132NEPBF16Zrk, X86::VFNMADD132NEPBF16Zmk, 0},
- {X86::VFNMADD132NEPBF16Zrkz, X86::VFNMADD132NEPBF16Zmkz, 0},
+ {X86::VFNMADD132BF16Z128rk, X86::VFNMADD132BF16Z128mk, 0},
+ {X86::VFNMADD132BF16Z128rkz, X86::VFNMADD132BF16Z128mkz, 0},
+ {X86::VFNMADD132BF16Z256rk, X86::VFNMADD132BF16Z256mk, 0},
+ {X86::VFNMADD132BF16Z256rkz, X86::VFNMADD132BF16Z256mkz, 0},
+ {X86::VFNMADD132BF16Zrk, X86::VFNMADD132BF16Zmk, 0},
+ {X86::VFNMADD132BF16Zrkz, X86::VFNMADD132BF16Zmkz, 0},
{X86::VFNMADD132PDZ128rk, X86::VFNMADD132PDZ128mk, 0},
{X86::VFNMADD132PDZ128rkz, X86::VFNMADD132PDZ128mkz, 0},
{X86::VFNMADD132PDZ256rk, X86::VFNMADD132PDZ256mk, 0},
@@ -6534,12 +6534,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFNMADD132SHZrkz_Int, X86::VFNMADD132SHZmkz_Int, TB_NO_REVERSE},
{X86::VFNMADD132SSZrk_Int, X86::VFNMADD132SSZmk_Int, TB_NO_REVERSE},
{X86::VFNMADD132SSZrkz_Int, X86::VFNMADD132SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFNMADD213NEPBF16Z128rk, X86::VFNMADD213NEPBF16Z128mk, 0},
- {X86::VFNMADD213NEPBF16Z128rkz, X86::VFNMADD213NEPBF16Z128mkz, 0},
- {X86::VFNMADD213NEPBF16Z256rk, X86::VFNMADD213NEPBF16Z256mk, 0},
- {X86::VFNMADD213NEPBF16Z256rkz, X86::VFNMADD213NEPBF16Z256mkz, 0},
- {X86::VFNMADD213NEPBF16Zrk, X86::VFNMADD213NEPBF16Zmk, 0},
- {X86::VFNMADD213NEPBF16Zrkz, X86::VFNMADD213NEPBF16Zmkz, 0},
+ {X86::VFNMADD213BF16Z128rk, X86::VFNMADD213BF16Z128mk, 0},
+ {X86::VFNMADD213BF16Z128rkz, X86::VFNMADD213BF16Z128mkz, 0},
+ {X86::VFNMADD213BF16Z256rk, X86::VFNMADD213BF16Z256mk, 0},
+ {X86::VFNMADD213BF16Z256rkz, X86::VFNMADD213BF16Z256mkz, 0},
+ {X86::VFNMADD213BF16Zrk, X86::VFNMADD213BF16Zmk, 0},
+ {X86::VFNMADD213BF16Zrkz, X86::VFNMADD213BF16Zmkz, 0},
{X86::VFNMADD213PDZ128rk, X86::VFNMADD213PDZ128mk, 0},
{X86::VFNMADD213PDZ128rkz, X86::VFNMADD213PDZ128mkz, 0},
{X86::VFNMADD213PDZ256rk, X86::VFNMADD213PDZ256mk, 0},
@@ -6564,12 +6564,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFNMADD213SHZrkz_Int, X86::VFNMADD213SHZmkz_Int, TB_NO_REVERSE},
{X86::VFNMADD213SSZrk_Int, X86::VFNMADD213SSZmk_Int, TB_NO_REVERSE},
{X86::VFNMADD213SSZrkz_Int, X86::VFNMADD213SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFNMADD231NEPBF16Z128rk, X86::VFNMADD231NEPBF16Z128mk, 0},
- {X86::VFNMADD231NEPBF16Z128rkz, X86::VFNMADD231NEPBF16Z128mkz, 0},
- {X86::VFNMADD231NEPBF16Z256rk, X86::VFNMADD231NEPBF16Z256mk, 0},
- {X86::VFNMADD231NEPBF16Z256rkz, X86::VFNMADD231NEPBF16Z256mkz, 0},
- {X86::VFNMADD231NEPBF16Zrk, X86::VFNMADD231NEPBF16Zmk, 0},
- {X86::VFNMADD231NEPBF16Zrkz, X86::VFNMADD231NEPBF16Zmkz, 0},
+ {X86::VFNMADD231BF16Z128rk, X86::VFNMADD231BF16Z128mk, 0},
+ {X86::VFNMADD231BF16Z128rkz, X86::VFNMADD231BF16Z128mkz, 0},
+ {X86::VFNMADD231BF16Z256rk, X86::VFNMADD231BF16Z256mk, 0},
+ {X86::VFNMADD231BF16Z256rkz, X86::VFNMADD231BF16Z256mkz, 0},
+ {X86::VFNMADD231BF16Zrk, X86::VFNMADD231BF16Zmk, 0},
+ {X86::VFNMADD231BF16Zrkz, X86::VFNMADD231BF16Zmkz, 0},
{X86::VFNMADD231PDZ128rk, X86::VFNMADD231PDZ128mk, 0},
{X86::VFNMADD231PDZ128rkz, X86::VFNMADD231PDZ128mkz, 0},
{X86::VFNMADD231PDZ256rk, X86::VFNMADD231PDZ256mk, 0},
@@ -6594,12 +6594,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFNMADD231SHZrkz_Int, X86::VFNMADD231SHZmkz_Int, TB_NO_REVERSE},
{X86::VFNMADD231SSZrk_Int, X86::VFNMADD231SSZmk_Int, TB_NO_REVERSE},
{X86::VFNMADD231SSZrkz_Int, X86::VFNMADD231SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFNMSUB132NEPBF16Z128rk, X86::VFNMSUB132NEPBF16Z128mk, 0},
- {X86::VFNMSUB132NEPBF16Z128rkz, X86::VFNMSUB132NEPBF16Z128mkz, 0},
- {X86::VFNMSUB132NEPBF16Z256rk, X86::VFNMSUB132NEPBF16Z256mk, 0},
- {X86::VFNMSUB132NEPBF16Z256rkz, X86::VFNMSUB132NEPBF16Z256mkz, 0},
- {X86::VFNMSUB132NEPBF16Zrk, X86::VFNMSUB132NEPBF16Zmk, 0},
- {X86::VFNMSUB132NEPBF16Zrkz, X86::VFNMSUB132NEPBF16Zmkz, 0},
+ {X86::VFNMSUB132BF16Z128rk, X86::VFNMSUB132BF16Z128mk, 0},
+ {X86::VFNMSUB132BF16Z128rkz, X86::VFNMSUB132BF16Z128mkz, 0},
+ {X86::VFNMSUB132BF16Z256rk, X86::VFNMSUB132BF16Z256mk, 0},
+ {X86::VFNMSUB132BF16Z256rkz, X86::VFNMSUB132BF16Z256mkz, 0},
+ {X86::VFNMSUB132BF16Zrk, X86::VFNMSUB132BF16Zmk, 0},
+ {X86::VFNMSUB132BF16Zrkz, X86::VFNMSUB132BF16Zmkz, 0},
{X86::VFNMSUB132PDZ128rk, X86::VFNMSUB132PDZ128mk, 0},
{X86::VFNMSUB132PDZ128rkz, X86::VFNMSUB132PDZ128mkz, 0},
{X86::VFNMSUB132PDZ256rk, X86::VFNMSUB132PDZ256mk, 0},
@@ -6624,12 +6624,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFNMSUB132SHZrkz_Int, X86::VFNMSUB132SHZmkz_Int, TB_NO_REVERSE},
{X86::VFNMSUB132SSZrk_Int, X86::VFNMSUB132SSZmk_Int, TB_NO_REVERSE},
{X86::VFNMSUB132SSZrkz_Int, X86::VFNMSUB132SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFNMSUB213NEPBF16Z128rk, X86::VFNMSUB213NEPBF16Z128mk, 0},
- {X86::VFNMSUB213NEPBF16Z128rkz, X86::VFNMSUB213NEPBF16Z128mkz, 0},
- {X86::VFNMSUB213NEPBF16Z256rk, X86::VFNMSUB213NEPBF16Z256mk, 0},
- {X86::VFNMSUB213NEPBF16Z256rkz, X86::VFNMSUB213NEPBF16Z256mkz, 0},
- {X86::VFNMSUB213NEPBF16Zrk, X86::VFNMSUB213NEPBF16Zmk, 0},
- {X86::VFNMSUB213NEPBF16Zrkz, X86::VFNMSUB213NEPBF16Zmkz, 0},
+ {X86::VFNMSUB213BF16Z128rk, X86::VFNMSUB213BF16Z128mk, 0},
+ {X86::VFNMSUB213BF16Z128rkz, X86::VFNMSUB213BF16Z128mkz, 0},
+ {X86::VFNMSUB213BF16Z256rk, X86::VFNMSUB213BF16Z256mk, 0},
+ {X86::VFNMSUB213BF16Z256rkz, X86::VFNMSUB213BF16Z256mkz, 0},
+ {X86::VFNMSUB213BF16Zrk, X86::VFNMSUB213BF16Zmk, 0},
+ {X86::VFNMSUB213BF16Zrkz, X86::VFNMSUB213BF16Zmkz, 0},
{X86::VFNMSUB213PDZ128rk, X86::VFNMSUB213PDZ128mk, 0},
{X86::VFNMSUB213PDZ128rkz, X86::VFNMSUB213PDZ128mkz, 0},
{X86::VFNMSUB213PDZ256rk, X86::VFNMSUB213PDZ256mk, 0},
@@ -6654,12 +6654,12 @@ static const X86FoldTableEntry Table4[] = {
{X86::VFNMSUB213SHZrkz_Int, X86::VFNMSUB213SHZmkz_Int, TB_NO_REVERSE},
{X86::VFNMSUB213SSZrk_Int, X86::VFNMSUB213SSZmk_Int, TB_NO_REVERSE},
{X86::VFNMSUB213SSZrkz_Int, X86::VFNMSUB213SSZmkz_Int, TB_NO_REVERSE},
- {X86::VFNMSUB231NEPBF16Z128rk, X86::VFNMSUB231NEPBF16Z128mk, 0},
- {X86::VFNMSUB231NEPBF16Z128rkz, X86::VFNMSUB231NEPBF16Z128mkz, 0},
- {X86::VFNMSUB231NEPBF16Z256rk, X86::VFNMSUB231NEPBF16Z256mk, 0},
- {X86::VFNMSUB231NEPBF16Z256rkz, X86::VFNMSUB231NEPBF16Z256mkz, 0},
- {X86::VFNMSUB231NEPBF16Zrk, X86::VFNMSUB231NEPBF16Zmk, 0},
- {X86::VFNMSUB231NEPBF16Zrkz, X86::VFNMSUB231NEPBF16Zmkz, 0},
+ {X86::VFNMSUB231BF16Z128rk, X86::VFNMSUB231BF16Z128mk, 0},
+ {X86::VFNMSUB231BF16Z128rkz, X86::VFNMSUB231BF16Z128mkz, 0},
+ {X86::VFNMSUB231BF16Z256rk, X86::VFNMSUB231BF16Z256mk, 0},
+ {X86::VFNMSUB231BF16Z256rkz, X86::VFNMSUB231BF16Z256mkz, 0},
+ {X86::VFNMSUB231BF16Zrk, X86::VFNMSUB231BF16Zmk, 0},
+ {X86::VFNMSUB231BF16Zrkz, X86::VFNMSUB231BF16Zmkz, 0},
{X86::VFNMSUB231PDZ128rk, X86::VFNMSUB231PDZ128mk, 0},
{X86::VFNMSUB231PDZ128rkz, X86::VFNMSUB231PDZ128mkz, 0},
{X86::VFNMSUB231PDZ256rk, X86::VFNMSUB231PDZ256mk, 0},
@@ -6711,6 +6711,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VINSERTI64X2Z256rrik, X86::VINSERTI64X2Z256rmik, 0},
{X86::VINSERTI64X2Zrrik, X86::VINSERTI64X2Zrmik, 0},
{X86::VINSERTI64X4Zrrik, X86::VINSERTI64X4Zrmik, 0},
+ {X86::VMAXBF16Z128rrk, X86::VMAXBF16Z128rmk, 0},
+ {X86::VMAXBF16Z256rrk, X86::VMAXBF16Z256rmk, 0},
+ {X86::VMAXBF16Zrrk, X86::VMAXBF16Zrmk, 0},
{X86::VMAXCPDZ128rrk, X86::VMAXCPDZ128rmk, 0},
{X86::VMAXCPDZ256rrk, X86::VMAXCPDZ256rmk, 0},
{X86::VMAXCPDZrrk, X86::VMAXCPDZrmk, 0},
@@ -6720,9 +6723,6 @@ static const X86FoldTableEntry Table4[] = {
{X86::VMAXCPSZ128rrk, X86::VMAXCPSZ128rmk, 0},
{X86::VMAXCPSZ256rrk, X86::VMAXCPSZ256rmk, 0},
{X86::VMAXCPSZrrk, X86::VMAXCPSZrmk, 0},
- {X86::VMAXPBF16Z128rrk, X86::VMAXPBF16Z128rmk, 0},
- {X86::VMAXPBF16Z256rrk, X86::VMAXPBF16Z256rmk, 0},
- {X86::VMAXPBF16Zrrk, X86::VMAXPBF16Zrmk, 0},
{X86::VMAXPDZ128rrk, X86::VMAXPDZ128rmk, 0},
{X86::VMAXPDZ256rrk, X86::VMAXPDZ256rmk, 0},
{X86::VMAXPDZrrk, X86::VMAXPDZrmk, 0},
@@ -6735,6 +6735,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VMAXSDZrrk_Int, X86::VMAXSDZrmk_Int, TB_NO_REVERSE},
{X86::VMAXSHZrrk_Int, X86::VMAXSHZrmk_Int, TB_NO_REVERSE},
{X86::VMAXSSZrrk_Int, X86::VMAXSSZrmk_Int, TB_NO_REVERSE},
+ {X86::VMINBF16Z128rrk, X86::VMINBF16Z128rmk, 0},
+ {X86::VMINBF16Z256rrk, X86::VMINBF16Z256rmk, 0},
+ {X86::VMINBF16Zrrk, X86::VMINBF16Zrmk, 0},
{X86::VMINCPDZ128rrk, X86::VMINCPDZ128rmk, 0},
{X86::VMINCPDZ256rrk, X86::VMINCPDZ256rmk, 0},
{X86::VMINCPDZrrk, X86::VMINCPDZrmk, 0},
@@ -6759,9 +6762,6 @@ static const X86FoldTableEntry Table4[] = {
{X86::VMINMAXSDrrik_Int, X86::VMINMAXSDrmik_Int, TB_NO_REVERSE},
{X86::VMINMAXSHrrik_Int, X86::VMINMAXSHrmik_Int, TB_NO_REVERSE},
{X86::VMINMAXSSrrik_Int, X86::VMINMAXSSrmik_Int, TB_NO_REVERSE},
- {X86::VMINPBF16Z128rrk, X86::VMINPBF16Z128rmk, 0},
- {X86::VMINPBF16Z256rrk, X86::VMINPBF16Z256rmk, 0},
- {X86::VMINPBF16Zrrk, X86::VMINPBF16Zrmk, 0},
{X86::VMINPDZ128rrk, X86::VMINPDZ128rmk, 0},
{X86::VMINPDZ256rrk, X86::VMINPDZ256rmk, 0},
{X86::VMINPDZrrk, X86::VMINPDZrmk, 0},
@@ -6777,9 +6777,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VMPSADBWZ128rrik, X86::VMPSADBWZ128rmik, 0},
{X86::VMPSADBWZ256rrik, X86::VMPSADBWZ256rmik, 0},
{X86::VMPSADBWZrrik, X86::VMPSADBWZrmik, 0},
- {X86::VMULNEPBF16Z128rrk, X86::VMULNEPBF16Z128rmk, 0},
- {X86::VMULNEPBF16Z256rrk, X86::VMULNEPBF16Z256rmk, 0},
- {X86::VMULNEPBF16Zrrk, X86::VMULNEPBF16Zrmk, 0},
+ {X86::VMULBF16Z128rrk, X86::VMULBF16Z128rmk, 0},
+ {X86::VMULBF16Z256rrk, X86::VMULBF16Z256rmk, 0},
+ {X86::VMULBF16Zrrk, X86::VMULBF16Zrmk, 0},
{X86::VMULPDZ128rrk, X86::VMULPDZ128rmk, 0},
{X86::VMULPDZ256rrk, X86::VMULPDZ256rmk, 0},
{X86::VMULPDZrrk, X86::VMULPDZrmk, 0},
@@ -7355,9 +7355,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VRSQRT28SDZrk, X86::VRSQRT28SDZmk, TB_NO_REVERSE},
{X86::VRSQRT28SSZrk, X86::VRSQRT28SSZmk, TB_NO_REVERSE},
{X86::VRSQRTSHZrrk, X86::VRSQRTSHZrmk, TB_NO_REVERSE},
- {X86::VSCALEFPBF16Z128rrk, X86::VSCALEFPBF16Z128rmk, 0},
- {X86::VSCALEFPBF16Z256rrk, X86::VSCALEFPBF16Z256rmk, 0},
- {X86::VSCALEFPBF16Zrrk, X86::VSCALEFPBF16Zrmk, 0},
+ {X86::VSCALEFBF16Z128rrk, X86::VSCALEFBF16Z128rmk, 0},
+ {X86::VSCALEFBF16Z256rrk, X86::VSCALEFBF16Z256rmk, 0},
+ {X86::VSCALEFBF16Zrrk, X86::VSCALEFBF16Zrmk, 0},
{X86::VSCALEFPDZ128rrk, X86::VSCALEFPDZ128rmk, 0},
{X86::VSCALEFPDZ256rrk, X86::VSCALEFPDZ256rmk, 0},
{X86::VSCALEFPDZrrk, X86::VSCALEFPDZrmk, 0},
@@ -7387,9 +7387,9 @@ static const X86FoldTableEntry Table4[] = {
{X86::VSQRTSDZrk_Int, X86::VSQRTSDZmk_Int, TB_NO_REVERSE},
{X86::VSQRTSHZrk_Int, X86::VSQRTSHZmk_Int, TB_NO_REVERSE},
{X86::VSQRTSSZrk_Int, X86::VSQRTSSZmk_Int, TB_NO_REVERSE},
- {X86::VSUBNEPBF16Z128rrk, X86::VSUBNEPBF16Z128rmk, 0},
- {X86::VSUBNEPBF16Z256rrk, X86::VSUBNEPBF16Z256rmk, 0},
- {X86::VSUBNEPBF16Zrrk, X86::VSUBNEPBF16Zrmk, 0},
+ {X86::VSUBBF16Z128rrk, X86::VSUBBF16Z128rmk, 0},
+ {X86::VSUBBF16Z256rrk, X86::VSUBBF16Z256rmk, 0},
+ {X86::VSUBBF16Zrrk, X86::VSUBBF16Zrmk, 0},
{X86::VSUBPDZ128rrk, X86::VSUBPDZ128rmk, 0},
{X86::VSUBPDZ256rrk, X86::VSUBPDZ256rmk, 0},
{X86::VSUBPDZrrk, X86::VSUBPDZrmk, 0},
@@ -7644,9 +7644,9 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VCVTW2PHZrr, X86::VCVTW2PHZrmb, TB_BCAST_W},
{X86::VEXP2PDZr, X86::VEXP2PDZmb, TB_BCAST_SD},
{X86::VEXP2PSZr, X86::VEXP2PSZmb, TB_BCAST_SS},
- {X86::VFPCLASSPBF16Z128ri, X86::VFPCLASSPBF16Z128mbi, TB_BCAST_SH},
- {X86::VFPCLASSPBF16Z256ri, X86::VFPCLASSPBF16Z256mbi, TB_BCAST_SH},
- {X86::VFPCLASSPBF16Zri, X86::VFPCLASSPBF16Zmbi, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Z128ri, X86::VFPCLASSBF16Z128mbi, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Z256ri, X86::VFPCLASSBF16Z256mbi, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Zri, X86::VFPCLASSBF16Zmbi, TB_BCAST_SH},
{X86::VFPCLASSPDZ128ri, X86::VFPCLASSPDZ128mbi, TB_BCAST_SD},
{X86::VFPCLASSPDZ256ri, X86::VFPCLASSPDZ256mbi, TB_BCAST_SD},
{X86::VFPCLASSPDZri, X86::VFPCLASSPDZmbi, TB_BCAST_SD},
@@ -7656,9 +7656,9 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VFPCLASSPSZ128ri, X86::VFPCLASSPSZ128mbi, TB_BCAST_SS},
{X86::VFPCLASSPSZ256ri, X86::VFPCLASSPSZ256mbi, TB_BCAST_SS},
{X86::VFPCLASSPSZri, X86::VFPCLASSPSZmbi, TB_BCAST_SS},
- {X86::VGETEXPPBF16Z128r, X86::VGETEXPPBF16Z128mb, TB_BCAST_SH},
- {X86::VGETEXPPBF16Z256r, X86::VGETEXPPBF16Z256mb, TB_BCAST_SH},
- {X86::VGETEXPPBF16Zr, X86::VGETEXPPBF16Zmb, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z128r, X86::VGETEXPBF16Z128mb, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z256r, X86::VGETEXPBF16Z256mb, TB_BCAST_SH},
+ {X86::VGETEXPBF16Zr, X86::VGETEXPBF16Zmb, TB_BCAST_SH},
{X86::VGETEXPPDZ128r, X86::VGETEXPPDZ128mb, TB_BCAST_SD},
{X86::VGETEXPPDZ256r, X86::VGETEXPPDZ256mb, TB_BCAST_SD},
{X86::VGETEXPPDZr, X86::VGETEXPPDZmb, TB_BCAST_SD},
@@ -7668,9 +7668,9 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VGETEXPPSZ128r, X86::VGETEXPPSZ128mb, TB_BCAST_SS},
{X86::VGETEXPPSZ256r, X86::VGETEXPPSZ256mb, TB_BCAST_SS},
{X86::VGETEXPPSZr, X86::VGETEXPPSZmb, TB_BCAST_SS},
- {X86::VGETMANTPBF16Z128rri, X86::VGETMANTPBF16Z128rmbi, TB_BCAST_SH},
- {X86::VGETMANTPBF16Z256rri, X86::VGETMANTPBF16Z256rmbi, TB_BCAST_SH},
- {X86::VGETMANTPBF16Zrri, X86::VGETMANTPBF16Zrmbi, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z128rri, X86::VGETMANTBF16Z128rmbi, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z256rri, X86::VGETMANTBF16Z256rmbi, TB_BCAST_SH},
+ {X86::VGETMANTBF16Zrri, X86::VGETMANTBF16Zrmbi, TB_BCAST_SH},
{X86::VGETMANTPDZ128rri, X86::VGETMANTPDZ128rmbi, TB_BCAST_SD},
{X86::VGETMANTPDZ256rri, X86::VGETMANTPDZ256rmbi, TB_BCAST_SD},
{X86::VGETMANTPDZrri, X86::VGETMANTPDZrmbi, TB_BCAST_SD},
@@ -7755,15 +7755,15 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VRCP14PSZr, X86::VRCP14PSZmb, TB_BCAST_SS},
{X86::VRCP28PDZr, X86::VRCP28PDZmb, TB_BCAST_SD},
{X86::VRCP28PSZr, X86::VRCP28PSZmb, TB_BCAST_SS},
- {X86::VRCPPBF16Z128r, X86::VRCPPBF16Z128mb, TB_BCAST_SH},
- {X86::VRCPPBF16Z256r, X86::VRCPPBF16Z256mb, TB_BCAST_SH},
- {X86::VRCPPBF16Zr, X86::VRCPPBF16Zmb, TB_BCAST_SH},
+ {X86::VRCPBF16Z128r, X86::VRCPBF16Z128mb, TB_BCAST_SH},
+ {X86::VRCPBF16Z256r, X86::VRCPBF16Z256mb, TB_BCAST_SH},
+ {X86::VRCPBF16Zr, X86::VRCPBF16Zmb, TB_BCAST_SH},
{X86::VRCPPHZ128r, X86::VRCPPHZ128mb, TB_BCAST_SH},
{X86::VRCPPHZ256r, X86::VRCPPHZ256mb, TB_BCAST_SH},
{X86::VRCPPHZr, X86::VRCPPHZmb, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z128rri, X86::VREDUCENEPBF16Z128rmbi, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z256rri, X86::VREDUCENEPBF16Z256rmbi, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Zrri, X86::VREDUCENEPBF16Zrmbi, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z128rri, X86::VREDUCEBF16Z128rmbi, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z256rri, X86::VREDUCEBF16Z256rmbi, TB_BCAST_SH},
+ {X86::VREDUCEBF16Zrri, X86::VREDUCEBF16Zrmbi, TB_BCAST_SH},
{X86::VREDUCEPDZ128rri, X86::VREDUCEPDZ128rmbi, TB_BCAST_SD},
{X86::VREDUCEPDZ256rri, X86::VREDUCEPDZ256rmbi, TB_BCAST_SD},
{X86::VREDUCEPDZrri, X86::VREDUCEPDZrmbi, TB_BCAST_SD},
@@ -7773,9 +7773,9 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VREDUCEPSZ128rri, X86::VREDUCEPSZ128rmbi, TB_BCAST_SS},
{X86::VREDUCEPSZ256rri, X86::VREDUCEPSZ256rmbi, TB_BCAST_SS},
{X86::VREDUCEPSZrri, X86::VREDUCEPSZrmbi, TB_BCAST_SS},
- {X86::VRNDSCALENEPBF16Z128rri, X86::VRNDSCALENEPBF16Z128rmbi, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Z256rri, X86::VRNDSCALENEPBF16Z256rmbi, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Zrri, X86::VRNDSCALENEPBF16Zrmbi, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z128rri, X86::VRNDSCALEBF16Z128rmbi, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z256rri, X86::VRNDSCALEBF16Z256rmbi, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Zrri, X86::VRNDSCALEBF16Zrmbi, TB_BCAST_SH},
{X86::VRNDSCALEPDZ128rri, X86::VRNDSCALEPDZ128rmbi, TB_BCAST_SD},
{X86::VRNDSCALEPDZ256rri, X86::VRNDSCALEPDZ256rmbi, TB_BCAST_SD},
{X86::VRNDSCALEPDZrri, X86::VRNDSCALEPDZrmbi, TB_BCAST_SD},
@@ -7793,15 +7793,15 @@ static const X86FoldTableEntry BroadcastTable1[] = {
{X86::VRSQRT14PSZr, X86::VRSQRT14PSZmb, TB_BCAST_SS},
{X86::VRSQRT28PDZr, X86::VRSQRT28PDZmb, TB_BCAST_SD},
{X86::VRSQRT28PSZr, X86::VRSQRT28PSZmb, TB_BCAST_SS},
- {X86::VRSQRTPBF16Z128r, X86::VRSQRTPBF16Z128mb, TB_BCAST_SH},
- {X86::VRSQRTPBF16Z256r, X86::VRSQRTPBF16Z256mb, TB_BCAST_SH},
- {X86::VRSQRTPBF16Zr, X86::VRSQRTPBF16Zmb, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z128r, X86::VRSQRTBF16Z128mb, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z256r, X86::VRSQRTBF16Z256mb, TB_BCAST_SH},
+ {X86::VRSQRTBF16Zr, X86::VRSQRTBF16Zmb, TB_BCAST_SH},
{X86::VRSQRTPHZ128r, X86::VRSQRTPHZ128mb, TB_BCAST_SH},
{X86::VRSQRTPHZ256r, X86::VRSQRTPHZ256mb, TB_BCAST_SH},
{X86::VRSQRTPHZr, X86::VRSQRTPHZmb, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Z128r, X86::VSQRTNEPBF16Z128mb, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Z256r, X86::VSQRTNEPBF16Z256mb, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Zr, X86::VSQRTNEPBF16Zmb, TB_BCAST_SH},
+ {X86::VSQRTBF16Z128r, X86::VSQRTBF16Z128mb, TB_BCAST_SH},
+ {X86::VSQRTBF16Z256r, X86::VSQRTBF16Z256mb, TB_BCAST_SH},
+ {X86::VSQRTBF16Zr, X86::VSQRTBF16Zmb, TB_BCAST_SH},
{X86::VSQRTPDZ128r, X86::VSQRTPDZ128mb, TB_BCAST_SD},
{X86::VSQRTPDZ256r, X86::VSQRTPDZ256mb, TB_BCAST_SD},
{X86::VSQRTPDZr, X86::VSQRTPDZmb, TB_BCAST_SD},
@@ -7814,9 +7814,9 @@ static const X86FoldTableEntry BroadcastTable1[] = {
};
static const X86FoldTableEntry BroadcastTable2[] = {
- {X86::VADDNEPBF16Z128rr, X86::VADDNEPBF16Z128rmb, TB_BCAST_SH},
- {X86::VADDNEPBF16Z256rr, X86::VADDNEPBF16Z256rmb, TB_BCAST_SH},
- {X86::VADDNEPBF16Zrr, X86::VADDNEPBF16Zrmb, TB_BCAST_SH},
+ {X86::VADDBF16Z128rr, X86::VADDBF16Z128rmb, TB_BCAST_SH},
+ {X86::VADDBF16Z256rr, X86::VADDBF16Z256rmb, TB_BCAST_SH},
+ {X86::VADDBF16Zrr, X86::VADDBF16Zrmb, TB_BCAST_SH},
{X86::VADDPDZ128rr, X86::VADDPDZ128rmb, TB_BCAST_SD},
{X86::VADDPDZ256rr, X86::VADDPDZ256rmb, TB_BCAST_SD},
{X86::VADDPDZrr, X86::VADDPDZrmb, TB_BCAST_SD},
@@ -7850,9 +7850,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VBLENDMPSZ128rr, X86::VBLENDMPSZ128rmb, TB_BCAST_SS},
{X86::VBLENDMPSZ256rr, X86::VBLENDMPSZ256rmb, TB_BCAST_SS},
{X86::VBLENDMPSZrr, X86::VBLENDMPSZrmb, TB_BCAST_SS},
- {X86::VCMPPBF16Z128rri, X86::VCMPPBF16Z128rmbi, TB_BCAST_SH},
- {X86::VCMPPBF16Z256rri, X86::VCMPPBF16Z256rmbi, TB_BCAST_SH},
- {X86::VCMPPBF16Zrri, X86::VCMPPBF16Zrmbi, TB_BCAST_SH},
+ {X86::VCMPBF16Z128rri, X86::VCMPBF16Z128rmbi, TB_BCAST_SH},
+ {X86::VCMPBF16Z256rri, X86::VCMPBF16Z256rmbi, TB_BCAST_SH},
+ {X86::VCMPBF16Zrri, X86::VCMPBF16Zrmbi, TB_BCAST_SH},
{X86::VCMPPDZ128rri, X86::VCMPPDZ128rmbi, TB_BCAST_SD},
{X86::VCMPPDZ256rri, X86::VCMPPDZ256rmbi, TB_BCAST_SD},
{X86::VCMPPDZrri, X86::VCMPPDZrmbi, TB_BCAST_SD},
@@ -8111,9 +8111,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VCVTW2PHZ128rrkz, X86::VCVTW2PHZ128rmbkz, TB_BCAST_W},
{X86::VCVTW2PHZ256rrkz, X86::VCVTW2PHZ256rmbkz, TB_BCAST_W},
{X86::VCVTW2PHZrrkz, X86::VCVTW2PHZrmbkz, TB_BCAST_W},
- {X86::VDIVNEPBF16Z128rr, X86::VDIVNEPBF16Z128rmb, TB_BCAST_SH},
- {X86::VDIVNEPBF16Z256rr, X86::VDIVNEPBF16Z256rmb, TB_BCAST_SH},
- {X86::VDIVNEPBF16Zrr, X86::VDIVNEPBF16Zrmb, TB_BCAST_SH},
+ {X86::VDIVBF16Z128rr, X86::VDIVBF16Z128rmb, TB_BCAST_SH},
+ {X86::VDIVBF16Z256rr, X86::VDIVBF16Z256rmb, TB_BCAST_SH},
+ {X86::VDIVBF16Zrr, X86::VDIVBF16Zrmb, TB_BCAST_SH},
{X86::VDIVPDZ128rr, X86::VDIVPDZ128rmb, TB_BCAST_SD},
{X86::VDIVPDZ256rr, X86::VDIVPDZ256rmb, TB_BCAST_SD},
{X86::VDIVPDZrr, X86::VDIVPDZrmb, TB_BCAST_SD},
@@ -8131,9 +8131,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VFMULCPHZ128rr, X86::VFMULCPHZ128rmb, TB_BCAST_SS},
{X86::VFMULCPHZ256rr, X86::VFMULCPHZ256rmb, TB_BCAST_SS},
{X86::VFMULCPHZrr, X86::VFMULCPHZrmb, TB_BCAST_SS},
- {X86::VFPCLASSPBF16Z128rik, X86::VFPCLASSPBF16Z128mbik, TB_BCAST_SH},
- {X86::VFPCLASSPBF16Z256rik, X86::VFPCLASSPBF16Z256mbik, TB_BCAST_SH},
- {X86::VFPCLASSPBF16Zrik, X86::VFPCLASSPBF16Zmbik, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Z128rik, X86::VFPCLASSBF16Z128mbik, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Z256rik, X86::VFPCLASSBF16Z256mbik, TB_BCAST_SH},
+ {X86::VFPCLASSBF16Zrik, X86::VFPCLASSBF16Zmbik, TB_BCAST_SH},
{X86::VFPCLASSPDZ128rik, X86::VFPCLASSPDZ128mbik, TB_BCAST_SD},
{X86::VFPCLASSPDZ256rik, X86::VFPCLASSPDZ256mbik, TB_BCAST_SD},
{X86::VFPCLASSPDZrik, X86::VFPCLASSPDZmbik, TB_BCAST_SD},
@@ -8143,9 +8143,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VFPCLASSPSZ128rik, X86::VFPCLASSPSZ128mbik, TB_BCAST_SS},
{X86::VFPCLASSPSZ256rik, X86::VFPCLASSPSZ256mbik, TB_BCAST_SS},
{X86::VFPCLASSPSZrik, X86::VFPCLASSPSZmbik, TB_BCAST_SS},
- {X86::VGETEXPPBF16Z128rkz, X86::VGETEXPPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VGETEXPPBF16Z256rkz, X86::VGETEXPPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VGETEXPPBF16Zrkz, X86::VGETEXPPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z128rkz, X86::VGETEXPBF16Z128mbkz, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z256rkz, X86::VGETEXPBF16Z256mbkz, TB_BCAST_SH},
+ {X86::VGETEXPBF16Zrkz, X86::VGETEXPBF16Zmbkz, TB_BCAST_SH},
{X86::VGETEXPPDZ128rkz, X86::VGETEXPPDZ128mbkz, TB_BCAST_SD},
{X86::VGETEXPPDZ256rkz, X86::VGETEXPPDZ256mbkz, TB_BCAST_SD},
{X86::VGETEXPPDZrkz, X86::VGETEXPPDZmbkz, TB_BCAST_SD},
@@ -8155,9 +8155,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VGETEXPPSZ128rkz, X86::VGETEXPPSZ128mbkz, TB_BCAST_SS},
{X86::VGETEXPPSZ256rkz, X86::VGETEXPPSZ256mbkz, TB_BCAST_SS},
{X86::VGETEXPPSZrkz, X86::VGETEXPPSZmbkz, TB_BCAST_SS},
- {X86::VGETMANTPBF16Z128rrikz, X86::VGETMANTPBF16Z128rmbikz, TB_BCAST_SH},
- {X86::VGETMANTPBF16Z256rrikz, X86::VGETMANTPBF16Z256rmbikz, TB_BCAST_SH},
- {X86::VGETMANTPBF16Zrrikz, X86::VGETMANTPBF16Zrmbikz, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z128rrikz, X86::VGETMANTBF16Z128rmbikz, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z256rrikz, X86::VGETMANTBF16Z256rmbikz, TB_BCAST_SH},
+ {X86::VGETMANTBF16Zrrikz, X86::VGETMANTBF16Zrmbikz, TB_BCAST_SH},
{X86::VGETMANTPDZ128rrikz, X86::VGETMANTPDZ128rmbikz, TB_BCAST_SD},
{X86::VGETMANTPDZ256rrikz, X86::VGETMANTPDZ256rmbikz, TB_BCAST_SD},
{X86::VGETMANTPDZrrikz, X86::VGETMANTPDZrmbikz, TB_BCAST_SD},
@@ -8173,6 +8173,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VGF2P8AFFINEQBZ128rri, X86::VGF2P8AFFINEQBZ128rmbi, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZ256rri, X86::VGF2P8AFFINEQBZ256rmbi, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZrri, X86::VGF2P8AFFINEQBZrmbi, TB_BCAST_Q},
+ {X86::VMAXBF16Z128rr, X86::VMAXBF16Z128rmb, TB_BCAST_SH},
+ {X86::VMAXBF16Z256rr, X86::VMAXBF16Z256rmb, TB_BCAST_SH},
+ {X86::VMAXBF16Zrr, X86::VMAXBF16Zrmb, TB_BCAST_SH},
{X86::VMAXCPDZ128rr, X86::VMAXCPDZ128rmb, TB_BCAST_SD},
{X86::VMAXCPDZ256rr, X86::VMAXCPDZ256rmb, TB_BCAST_SD},
{X86::VMAXCPDZrr, X86::VMAXCPDZrmb, TB_BCAST_SD},
@@ -8182,9 +8185,6 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VMAXCPSZ128rr, X86::VMAXCPSZ128rmb, TB_BCAST_SS},
{X86::VMAXCPSZ256rr, X86::VMAXCPSZ256rmb, TB_BCAST_SS},
{X86::VMAXCPSZrr, X86::VMAXCPSZrmb, TB_BCAST_SS},
- {X86::VMAXPBF16Z128rr, X86::VMAXPBF16Z128rmb, TB_BCAST_SH},
- {X86::VMAXPBF16Z256rr, X86::VMAXPBF16Z256rmb, TB_BCAST_SH},
- {X86::VMAXPBF16Zrr, X86::VMAXPBF16Zrmb, TB_BCAST_SH},
{X86::VMAXPDZ128rr, X86::VMAXPDZ128rmb, TB_BCAST_SD},
{X86::VMAXPDZ256rr, X86::VMAXPDZ256rmb, TB_BCAST_SD},
{X86::VMAXPDZrr, X86::VMAXPDZrmb, TB_BCAST_SD},
@@ -8194,6 +8194,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VMAXPSZ128rr, X86::VMAXPSZ128rmb, TB_BCAST_SS},
{X86::VMAXPSZ256rr, X86::VMAXPSZ256rmb, TB_BCAST_SS},
{X86::VMAXPSZrr, X86::VMAXPSZrmb, TB_BCAST_SS},
+ {X86::VMINBF16Z128rr, X86::VMINBF16Z128rmb, TB_BCAST_SH},
+ {X86::VMINBF16Z256rr, X86::VMINBF16Z256rmb, TB_BCAST_SH},
+ {X86::VMINBF16Zrr, X86::VMINBF16Zrmb, TB_BCAST_SH},
{X86::VMINCPDZ128rr, X86::VMINCPDZ128rmb, TB_BCAST_SD},
{X86::VMINCPDZ256rr, X86::VMINCPDZ256rmb, TB_BCAST_SD},
{X86::VMINCPDZrr, X86::VMINCPDZrmb, TB_BCAST_SD},
@@ -8215,9 +8218,6 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VMINMAXPSZ128rri, X86::VMINMAXPSZ128rmbi, TB_BCAST_SS},
{X86::VMINMAXPSZ256rri, X86::VMINMAXPSZ256rmbi, TB_BCAST_SS},
{X86::VMINMAXPSZrri, X86::VMINMAXPSZrmbi, TB_BCAST_SS},
- {X86::VMINPBF16Z128rr, X86::VMINPBF16Z128rmb, TB_BCAST_SH},
- {X86::VMINPBF16Z256rr, X86::VMINPBF16Z256rmb, TB_BCAST_SH},
- {X86::VMINPBF16Zrr, X86::VMINPBF16Zrmb, TB_BCAST_SH},
{X86::VMINPDZ128rr, X86::VMINPDZ128rmb, TB_BCAST_SD},
{X86::VMINPDZ256rr, X86::VMINPDZ256rmb, TB_BCAST_SD},
{X86::VMINPDZrr, X86::VMINPDZrmb, TB_BCAST_SD},
@@ -8227,9 +8227,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VMINPSZ128rr, X86::VMINPSZ128rmb, TB_BCAST_SS},
{X86::VMINPSZ256rr, X86::VMINPSZ256rmb, TB_BCAST_SS},
{X86::VMINPSZrr, X86::VMINPSZrmb, TB_BCAST_SS},
- {X86::VMULNEPBF16Z128rr, X86::VMULNEPBF16Z128rmb, TB_BCAST_SH},
- {X86::VMULNEPBF16Z256rr, X86::VMULNEPBF16Z256rmb, TB_BCAST_SH},
- {X86::VMULNEPBF16Zrr, X86::VMULNEPBF16Zrmb, TB_BCAST_SH},
+ {X86::VMULBF16Z128rr, X86::VMULBF16Z128rmb, TB_BCAST_SH},
+ {X86::VMULBF16Z256rr, X86::VMULBF16Z256rmb, TB_BCAST_SH},
+ {X86::VMULBF16Zrr, X86::VMULBF16Zrmb, TB_BCAST_SH},
{X86::VMULPDZ128rr, X86::VMULPDZ128rmb, TB_BCAST_SD},
{X86::VMULPDZ256rr, X86::VMULPDZ256rmb, TB_BCAST_SD},
{X86::VMULPDZrr, X86::VMULPDZrmb, TB_BCAST_SD},
@@ -8523,15 +8523,15 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VRCP14PSZrkz, X86::VRCP14PSZmbkz, TB_BCAST_SS},
{X86::VRCP28PDZrkz, X86::VRCP28PDZmbkz, TB_BCAST_SD},
{X86::VRCP28PSZrkz, X86::VRCP28PSZmbkz, TB_BCAST_SS},
- {X86::VRCPPBF16Z128rkz, X86::VRCPPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VRCPPBF16Z256rkz, X86::VRCPPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VRCPPBF16Zrkz, X86::VRCPPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VRCPBF16Z128rkz, X86::VRCPBF16Z128mbkz, TB_BCAST_SH},
+ {X86::VRCPBF16Z256rkz, X86::VRCPBF16Z256mbkz, TB_BCAST_SH},
+ {X86::VRCPBF16Zrkz, X86::VRCPBF16Zmbkz, TB_BCAST_SH},
{X86::VRCPPHZ128rkz, X86::VRCPPHZ128mbkz, TB_BCAST_SH},
{X86::VRCPPHZ256rkz, X86::VRCPPHZ256mbkz, TB_BCAST_SH},
{X86::VRCPPHZrkz, X86::VRCPPHZmbkz, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z128rrikz, X86::VREDUCENEPBF16Z128rmbikz, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z256rrikz, X86::VREDUCENEPBF16Z256rmbikz, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Zrrikz, X86::VREDUCENEPBF16Zrmbikz, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z128rrikz, X86::VREDUCEBF16Z128rmbikz, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z256rrikz, X86::VREDUCEBF16Z256rmbikz, TB_BCAST_SH},
+ {X86::VREDUCEBF16Zrrikz, X86::VREDUCEBF16Zrmbikz, TB_BCAST_SH},
{X86::VREDUCEPDZ128rrikz, X86::VREDUCEPDZ128rmbikz, TB_BCAST_SD},
{X86::VREDUCEPDZ256rrikz, X86::VREDUCEPDZ256rmbikz, TB_BCAST_SD},
{X86::VREDUCEPDZrrikz, X86::VREDUCEPDZrmbikz, TB_BCAST_SD},
@@ -8541,9 +8541,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VREDUCEPSZ128rrikz, X86::VREDUCEPSZ128rmbikz, TB_BCAST_SS},
{X86::VREDUCEPSZ256rrikz, X86::VREDUCEPSZ256rmbikz, TB_BCAST_SS},
{X86::VREDUCEPSZrrikz, X86::VREDUCEPSZrmbikz, TB_BCAST_SS},
- {X86::VRNDSCALENEPBF16Z128rrikz, X86::VRNDSCALENEPBF16Z128rmbikz, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Z256rrikz, X86::VRNDSCALENEPBF16Z256rmbikz, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Zrrikz, X86::VRNDSCALENEPBF16Zrmbikz, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z128rrikz, X86::VRNDSCALEBF16Z128rmbikz, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z256rrikz, X86::VRNDSCALEBF16Z256rmbikz, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Zrrikz, X86::VRNDSCALEBF16Zrmbikz, TB_BCAST_SH},
{X86::VRNDSCALEPDZ128rrikz, X86::VRNDSCALEPDZ128rmbikz, TB_BCAST_SD},
{X86::VRNDSCALEPDZ256rrikz, X86::VRNDSCALEPDZ256rmbikz, TB_BCAST_SD},
{X86::VRNDSCALEPDZrrikz, X86::VRNDSCALEPDZrmbikz, TB_BCAST_SD},
@@ -8561,15 +8561,15 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VRSQRT14PSZrkz, X86::VRSQRT14PSZmbkz, TB_BCAST_SS},
{X86::VRSQRT28PDZrkz, X86::VRSQRT28PDZmbkz, TB_BCAST_SD},
{X86::VRSQRT28PSZrkz, X86::VRSQRT28PSZmbkz, TB_BCAST_SS},
- {X86::VRSQRTPBF16Z128rkz, X86::VRSQRTPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VRSQRTPBF16Z256rkz, X86::VRSQRTPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VRSQRTPBF16Zrkz, X86::VRSQRTPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z128rkz, X86::VRSQRTBF16Z128mbkz, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z256rkz, X86::VRSQRTBF16Z256mbkz, TB_BCAST_SH},
+ {X86::VRSQRTBF16Zrkz, X86::VRSQRTBF16Zmbkz, TB_BCAST_SH},
{X86::VRSQRTPHZ128rkz, X86::VRSQRTPHZ128mbkz, TB_BCAST_SH},
{X86::VRSQRTPHZ256rkz, X86::VRSQRTPHZ256mbkz, TB_BCAST_SH},
{X86::VRSQRTPHZrkz, X86::VRSQRTPHZmbkz, TB_BCAST_SH},
- {X86::VSCALEFPBF16Z128rr, X86::VSCALEFPBF16Z128rmb, TB_BCAST_SH},
- {X86::VSCALEFPBF16Z256rr, X86::VSCALEFPBF16Z256rmb, TB_BCAST_SH},
- {X86::VSCALEFPBF16Zrr, X86::VSCALEFPBF16Zrmb, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z128rr, X86::VSCALEFBF16Z128rmb, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z256rr, X86::VSCALEFBF16Z256rmb, TB_BCAST_SH},
+ {X86::VSCALEFBF16Zrr, X86::VSCALEFBF16Zrmb, TB_BCAST_SH},
{X86::VSCALEFPDZ128rr, X86::VSCALEFPDZ128rmb, TB_BCAST_SD},
{X86::VSCALEFPDZ256rr, X86::VSCALEFPDZ256rmb, TB_BCAST_SD},
{X86::VSCALEFPDZrr, X86::VSCALEFPDZrmb, TB_BCAST_SD},
@@ -8593,9 +8593,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VSHUFPSZ128rri, X86::VSHUFPSZ128rmbi, TB_BCAST_SS},
{X86::VSHUFPSZ256rri, X86::VSHUFPSZ256rmbi, TB_BCAST_SS},
{X86::VSHUFPSZrri, X86::VSHUFPSZrmbi, TB_BCAST_SS},
- {X86::VSQRTNEPBF16Z128rkz, X86::VSQRTNEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Z256rkz, X86::VSQRTNEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Zrkz, X86::VSQRTNEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VSQRTBF16Z128rkz, X86::VSQRTBF16Z128mbkz, TB_BCAST_SH},
+ {X86::VSQRTBF16Z256rkz, X86::VSQRTBF16Z256mbkz, TB_BCAST_SH},
+ {X86::VSQRTBF16Zrkz, X86::VSQRTBF16Zmbkz, TB_BCAST_SH},
{X86::VSQRTPDZ128rkz, X86::VSQRTPDZ128mbkz, TB_BCAST_SD},
{X86::VSQRTPDZ256rkz, X86::VSQRTPDZ256mbkz, TB_BCAST_SD},
{X86::VSQRTPDZrkz, X86::VSQRTPDZmbkz, TB_BCAST_SD},
@@ -8605,9 +8605,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
{X86::VSQRTPSZ128rkz, X86::VSQRTPSZ128mbkz, TB_BCAST_SS},
{X86::VSQRTPSZ256rkz, X86::VSQRTPSZ256mbkz, TB_BCAST_SS},
{X86::VSQRTPSZrkz, X86::VSQRTPSZmbkz, TB_BCAST_SS},
- {X86::VSUBNEPBF16Z128rr, X86::VSUBNEPBF16Z128rmb, TB_BCAST_SH},
- {X86::VSUBNEPBF16Z256rr, X86::VSUBNEPBF16Z256rmb, TB_BCAST_SH},
- {X86::VSUBNEPBF16Zrr, X86::VSUBNEPBF16Zrmb, TB_BCAST_SH},
+ {X86::VSUBBF16Z128rr, X86::VSUBBF16Z128rmb, TB_BCAST_SH},
+ {X86::VSUBBF16Z256rr, X86::VSUBBF16Z256rmb, TB_BCAST_SH},
+ {X86::VSUBBF16Zrr, X86::VSUBBF16Zrmb, TB_BCAST_SH},
{X86::VSUBPDZ128rr, X86::VSUBPDZ128rmb, TB_BCAST_SD},
{X86::VSUBPDZ256rr, X86::VSUBPDZ256rmb, TB_BCAST_SD},
{X86::VSUBPDZrr, X86::VSUBPDZrmb, TB_BCAST_SD},
@@ -8638,9 +8638,9 @@ static const X86FoldTableEntry BroadcastTable2[] = {
};
static const X86FoldTableEntry BroadcastTable3[] = {
- {X86::VADDNEPBF16Z128rrkz, X86::VADDNEPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VADDNEPBF16Z256rrkz, X86::VADDNEPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VADDNEPBF16Zrrkz, X86::VADDNEPBF16Zrmbkz, TB_BCAST_SH},
+ {X86::VADDBF16Z128rrkz, X86::VADDBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VADDBF16Z256rrkz, X86::VADDBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VADDBF16Zrrkz, X86::VADDBF16Zrmbkz, TB_BCAST_SH},
{X86::VADDPDZ128rrkz, X86::VADDPDZ128rmbkz, TB_BCAST_SD},
{X86::VADDPDZ256rrkz, X86::VADDPDZ256rmbkz, TB_BCAST_SD},
{X86::VADDPDZrrkz, X86::VADDPDZrmbkz, TB_BCAST_SD},
@@ -8674,9 +8674,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VBLENDMPSZ128rrk, X86::VBLENDMPSZ128rmbk, TB_BCAST_SS},
{X86::VBLENDMPSZ256rrk, X86::VBLENDMPSZ256rmbk, TB_BCAST_SS},
{X86::VBLENDMPSZrrk, X86::VBLENDMPSZrmbk, TB_BCAST_SS},
- {X86::VCMPPBF16Z128rrik, X86::VCMPPBF16Z128rmbik, TB_BCAST_SH},
- {X86::VCMPPBF16Z256rrik, X86::VCMPPBF16Z256rmbik, TB_BCAST_SH},
- {X86::VCMPPBF16Zrrik, X86::VCMPPBF16Zrmbik, TB_BCAST_SH},
+ {X86::VCMPBF16Z128rrik, X86::VCMPBF16Z128rmbik, TB_BCAST_SH},
+ {X86::VCMPBF16Z256rrik, X86::VCMPBF16Z256rmbik, TB_BCAST_SH},
+ {X86::VCMPBF16Zrrik, X86::VCMPBF16Zrmbik, TB_BCAST_SH},
{X86::VCMPPDZ128rrik, X86::VCMPPDZ128rmbik, TB_BCAST_SD},
{X86::VCMPPDZ256rrik, X86::VCMPPDZ256rmbik, TB_BCAST_SD},
{X86::VCMPPDZrrik, X86::VCMPPDZrmbik, TB_BCAST_SD},
@@ -8935,9 +8935,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VCVTW2PHZ128rrk, X86::VCVTW2PHZ128rmbk, TB_BCAST_W},
{X86::VCVTW2PHZ256rrk, X86::VCVTW2PHZ256rmbk, TB_BCAST_W},
{X86::VCVTW2PHZrrk, X86::VCVTW2PHZrmbk, TB_BCAST_W},
- {X86::VDIVNEPBF16Z128rrkz, X86::VDIVNEPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VDIVNEPBF16Z256rrkz, X86::VDIVNEPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VDIVNEPBF16Zrrkz, X86::VDIVNEPBF16Zrmbkz, TB_BCAST_SH},
+ {X86::VDIVBF16Z128rrkz, X86::VDIVBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VDIVBF16Z256rrkz, X86::VDIVBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VDIVBF16Zrrkz, X86::VDIVBF16Zrmbkz, TB_BCAST_SH},
{X86::VDIVPDZ128rrkz, X86::VDIVPDZ128rmbkz, TB_BCAST_SD},
{X86::VDIVPDZ256rrkz, X86::VDIVPDZ256rmbkz, TB_BCAST_SD},
{X86::VDIVPDZrrkz, X86::VDIVPDZrmbkz, TB_BCAST_SD},
@@ -8967,9 +8967,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFIXUPIMMPSZ128rri, X86::VFIXUPIMMPSZ128rmbi, TB_BCAST_SS},
{X86::VFIXUPIMMPSZ256rri, X86::VFIXUPIMMPSZ256rmbi, TB_BCAST_SS},
{X86::VFIXUPIMMPSZrri, X86::VFIXUPIMMPSZrmbi, TB_BCAST_SS},
- {X86::VFMADD132NEPBF16Z128r, X86::VFMADD132NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Z256r, X86::VFMADD132NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Zr, X86::VFMADD132NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z128r, X86::VFMADD132BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z256r, X86::VFMADD132BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMADD132BF16Zr, X86::VFMADD132BF16Zmb, TB_BCAST_SH},
{X86::VFMADD132PDZ128r, X86::VFMADD132PDZ128mb, TB_BCAST_SD},
{X86::VFMADD132PDZ256r, X86::VFMADD132PDZ256mb, TB_BCAST_SD},
{X86::VFMADD132PDZr, X86::VFMADD132PDZmb, TB_BCAST_SD},
@@ -8979,9 +8979,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMADD132PSZ128r, X86::VFMADD132PSZ128mb, TB_BCAST_SS},
{X86::VFMADD132PSZ256r, X86::VFMADD132PSZ256mb, TB_BCAST_SS},
{X86::VFMADD132PSZr, X86::VFMADD132PSZmb, TB_BCAST_SS},
- {X86::VFMADD213NEPBF16Z128r, X86::VFMADD213NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Z256r, X86::VFMADD213NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Zr, X86::VFMADD213NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z128r, X86::VFMADD213BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z256r, X86::VFMADD213BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMADD213BF16Zr, X86::VFMADD213BF16Zmb, TB_BCAST_SH},
{X86::VFMADD213PDZ128r, X86::VFMADD213PDZ128mb, TB_BCAST_SD},
{X86::VFMADD213PDZ256r, X86::VFMADD213PDZ256mb, TB_BCAST_SD},
{X86::VFMADD213PDZr, X86::VFMADD213PDZmb, TB_BCAST_SD},
@@ -8991,9 +8991,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMADD213PSZ128r, X86::VFMADD213PSZ128mb, TB_BCAST_SS},
{X86::VFMADD213PSZ256r, X86::VFMADD213PSZ256mb, TB_BCAST_SS},
{X86::VFMADD213PSZr, X86::VFMADD213PSZmb, TB_BCAST_SS},
- {X86::VFMADD231NEPBF16Z128r, X86::VFMADD231NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Z256r, X86::VFMADD231NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Zr, X86::VFMADD231NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z128r, X86::VFMADD231BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z256r, X86::VFMADD231BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMADD231BF16Zr, X86::VFMADD231BF16Zmb, TB_BCAST_SH},
{X86::VFMADD231PDZ128r, X86::VFMADD231PDZ128mb, TB_BCAST_SD},
{X86::VFMADD231PDZ256r, X86::VFMADD231PDZ256mb, TB_BCAST_SD},
{X86::VFMADD231PDZr, X86::VFMADD231PDZmb, TB_BCAST_SD},
@@ -9033,9 +9033,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMADDSUB231PSZ128r, X86::VFMADDSUB231PSZ128mb, TB_BCAST_SS},
{X86::VFMADDSUB231PSZ256r, X86::VFMADDSUB231PSZ256mb, TB_BCAST_SS},
{X86::VFMADDSUB231PSZr, X86::VFMADDSUB231PSZmb, TB_BCAST_SS},
- {X86::VFMSUB132NEPBF16Z128r, X86::VFMSUB132NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Z256r, X86::VFMSUB132NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Zr, X86::VFMSUB132NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z128r, X86::VFMSUB132BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z256r, X86::VFMSUB132BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Zr, X86::VFMSUB132BF16Zmb, TB_BCAST_SH},
{X86::VFMSUB132PDZ128r, X86::VFMSUB132PDZ128mb, TB_BCAST_SD},
{X86::VFMSUB132PDZ256r, X86::VFMSUB132PDZ256mb, TB_BCAST_SD},
{X86::VFMSUB132PDZr, X86::VFMSUB132PDZmb, TB_BCAST_SD},
@@ -9045,9 +9045,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMSUB132PSZ128r, X86::VFMSUB132PSZ128mb, TB_BCAST_SS},
{X86::VFMSUB132PSZ256r, X86::VFMSUB132PSZ256mb, TB_BCAST_SS},
{X86::VFMSUB132PSZr, X86::VFMSUB132PSZmb, TB_BCAST_SS},
- {X86::VFMSUB213NEPBF16Z128r, X86::VFMSUB213NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Z256r, X86::VFMSUB213NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Zr, X86::VFMSUB213NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z128r, X86::VFMSUB213BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z256r, X86::VFMSUB213BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Zr, X86::VFMSUB213BF16Zmb, TB_BCAST_SH},
{X86::VFMSUB213PDZ128r, X86::VFMSUB213PDZ128mb, TB_BCAST_SD},
{X86::VFMSUB213PDZ256r, X86::VFMSUB213PDZ256mb, TB_BCAST_SD},
{X86::VFMSUB213PDZr, X86::VFMSUB213PDZmb, TB_BCAST_SD},
@@ -9057,9 +9057,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMSUB213PSZ128r, X86::VFMSUB213PSZ128mb, TB_BCAST_SS},
{X86::VFMSUB213PSZ256r, X86::VFMSUB213PSZ256mb, TB_BCAST_SS},
{X86::VFMSUB213PSZr, X86::VFMSUB213PSZmb, TB_BCAST_SS},
- {X86::VFMSUB231NEPBF16Z128r, X86::VFMSUB231NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Z256r, X86::VFMSUB231NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Zr, X86::VFMSUB231NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z128r, X86::VFMSUB231BF16Z128mb, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z256r, X86::VFMSUB231BF16Z256mb, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Zr, X86::VFMSUB231BF16Zmb, TB_BCAST_SH},
{X86::VFMSUB231PDZ128r, X86::VFMSUB231PDZ128mb, TB_BCAST_SD},
{X86::VFMSUB231PDZ256r, X86::VFMSUB231PDZ256mb, TB_BCAST_SD},
{X86::VFMSUB231PDZr, X86::VFMSUB231PDZmb, TB_BCAST_SD},
@@ -9099,9 +9099,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFMULCPHZ128rrkz, X86::VFMULCPHZ128rmbkz, TB_BCAST_SS},
{X86::VFMULCPHZ256rrkz, X86::VFMULCPHZ256rmbkz, TB_BCAST_SS},
{X86::VFMULCPHZrrkz, X86::VFMULCPHZrmbkz, TB_BCAST_SS},
- {X86::VFNMADD132NEPBF16Z128r, X86::VFNMADD132NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Z256r, X86::VFNMADD132NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Zr, X86::VFNMADD132NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z128r, X86::VFNMADD132BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z256r, X86::VFNMADD132BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Zr, X86::VFNMADD132BF16Zmb, TB_BCAST_SH},
{X86::VFNMADD132PDZ128r, X86::VFNMADD132PDZ128mb, TB_BCAST_SD},
{X86::VFNMADD132PDZ256r, X86::VFNMADD132PDZ256mb, TB_BCAST_SD},
{X86::VFNMADD132PDZr, X86::VFNMADD132PDZmb, TB_BCAST_SD},
@@ -9111,9 +9111,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMADD132PSZ128r, X86::VFNMADD132PSZ128mb, TB_BCAST_SS},
{X86::VFNMADD132PSZ256r, X86::VFNMADD132PSZ256mb, TB_BCAST_SS},
{X86::VFNMADD132PSZr, X86::VFNMADD132PSZmb, TB_BCAST_SS},
- {X86::VFNMADD213NEPBF16Z128r, X86::VFNMADD213NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Z256r, X86::VFNMADD213NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Zr, X86::VFNMADD213NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z128r, X86::VFNMADD213BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z256r, X86::VFNMADD213BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Zr, X86::VFNMADD213BF16Zmb, TB_BCAST_SH},
{X86::VFNMADD213PDZ128r, X86::VFNMADD213PDZ128mb, TB_BCAST_SD},
{X86::VFNMADD213PDZ256r, X86::VFNMADD213PDZ256mb, TB_BCAST_SD},
{X86::VFNMADD213PDZr, X86::VFNMADD213PDZmb, TB_BCAST_SD},
@@ -9123,9 +9123,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMADD213PSZ128r, X86::VFNMADD213PSZ128mb, TB_BCAST_SS},
{X86::VFNMADD213PSZ256r, X86::VFNMADD213PSZ256mb, TB_BCAST_SS},
{X86::VFNMADD213PSZr, X86::VFNMADD213PSZmb, TB_BCAST_SS},
- {X86::VFNMADD231NEPBF16Z128r, X86::VFNMADD231NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Z256r, X86::VFNMADD231NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Zr, X86::VFNMADD231NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z128r, X86::VFNMADD231BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z256r, X86::VFNMADD231BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Zr, X86::VFNMADD231BF16Zmb, TB_BCAST_SH},
{X86::VFNMADD231PDZ128r, X86::VFNMADD231PDZ128mb, TB_BCAST_SD},
{X86::VFNMADD231PDZ256r, X86::VFNMADD231PDZ256mb, TB_BCAST_SD},
{X86::VFNMADD231PDZr, X86::VFNMADD231PDZmb, TB_BCAST_SD},
@@ -9135,9 +9135,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMADD231PSZ128r, X86::VFNMADD231PSZ128mb, TB_BCAST_SS},
{X86::VFNMADD231PSZ256r, X86::VFNMADD231PSZ256mb, TB_BCAST_SS},
{X86::VFNMADD231PSZr, X86::VFNMADD231PSZmb, TB_BCAST_SS},
- {X86::VFNMSUB132NEPBF16Z128r, X86::VFNMSUB132NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Z256r, X86::VFNMSUB132NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Zr, X86::VFNMSUB132NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z128r, X86::VFNMSUB132BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z256r, X86::VFNMSUB132BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Zr, X86::VFNMSUB132BF16Zmb, TB_BCAST_SH},
{X86::VFNMSUB132PDZ128r, X86::VFNMSUB132PDZ128mb, TB_BCAST_SD},
{X86::VFNMSUB132PDZ256r, X86::VFNMSUB132PDZ256mb, TB_BCAST_SD},
{X86::VFNMSUB132PDZr, X86::VFNMSUB132PDZmb, TB_BCAST_SD},
@@ -9147,9 +9147,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMSUB132PSZ128r, X86::VFNMSUB132PSZ128mb, TB_BCAST_SS},
{X86::VFNMSUB132PSZ256r, X86::VFNMSUB132PSZ256mb, TB_BCAST_SS},
{X86::VFNMSUB132PSZr, X86::VFNMSUB132PSZmb, TB_BCAST_SS},
- {X86::VFNMSUB213NEPBF16Z128r, X86::VFNMSUB213NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Z256r, X86::VFNMSUB213NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Zr, X86::VFNMSUB213NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z128r, X86::VFNMSUB213BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z256r, X86::VFNMSUB213BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Zr, X86::VFNMSUB213BF16Zmb, TB_BCAST_SH},
{X86::VFNMSUB213PDZ128r, X86::VFNMSUB213PDZ128mb, TB_BCAST_SD},
{X86::VFNMSUB213PDZ256r, X86::VFNMSUB213PDZ256mb, TB_BCAST_SD},
{X86::VFNMSUB213PDZr, X86::VFNMSUB213PDZmb, TB_BCAST_SD},
@@ -9159,9 +9159,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMSUB213PSZ128r, X86::VFNMSUB213PSZ128mb, TB_BCAST_SS},
{X86::VFNMSUB213PSZ256r, X86::VFNMSUB213PSZ256mb, TB_BCAST_SS},
{X86::VFNMSUB213PSZr, X86::VFNMSUB213PSZmb, TB_BCAST_SS},
- {X86::VFNMSUB231NEPBF16Z128r, X86::VFNMSUB231NEPBF16Z128mb, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Z256r, X86::VFNMSUB231NEPBF16Z256mb, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Zr, X86::VFNMSUB231NEPBF16Zmb, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z128r, X86::VFNMSUB231BF16Z128mb, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z256r, X86::VFNMSUB231BF16Z256mb, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Zr, X86::VFNMSUB231BF16Zmb, TB_BCAST_SH},
{X86::VFNMSUB231PDZ128r, X86::VFNMSUB231PDZ128mb, TB_BCAST_SD},
{X86::VFNMSUB231PDZ256r, X86::VFNMSUB231PDZ256mb, TB_BCAST_SD},
{X86::VFNMSUB231PDZr, X86::VFNMSUB231PDZmb, TB_BCAST_SD},
@@ -9171,9 +9171,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VFNMSUB231PSZ128r, X86::VFNMSUB231PSZ128mb, TB_BCAST_SS},
{X86::VFNMSUB231PSZ256r, X86::VFNMSUB231PSZ256mb, TB_BCAST_SS},
{X86::VFNMSUB231PSZr, X86::VFNMSUB231PSZmb, TB_BCAST_SS},
- {X86::VGETEXPPBF16Z128rk, X86::VGETEXPPBF16Z128mbk, TB_BCAST_SH},
- {X86::VGETEXPPBF16Z256rk, X86::VGETEXPPBF16Z256mbk, TB_BCAST_SH},
- {X86::VGETEXPPBF16Zrk, X86::VGETEXPPBF16Zmbk, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z128rk, X86::VGETEXPBF16Z128mbk, TB_BCAST_SH},
+ {X86::VGETEXPBF16Z256rk, X86::VGETEXPBF16Z256mbk, TB_BCAST_SH},
+ {X86::VGETEXPBF16Zrk, X86::VGETEXPBF16Zmbk, TB_BCAST_SH},
{X86::VGETEXPPDZ128rk, X86::VGETEXPPDZ128mbk, TB_BCAST_SD},
{X86::VGETEXPPDZ256rk, X86::VGETEXPPDZ256mbk, TB_BCAST_SD},
{X86::VGETEXPPDZrk, X86::VGETEXPPDZmbk, TB_BCAST_SD},
@@ -9183,9 +9183,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VGETEXPPSZ128rk, X86::VGETEXPPSZ128mbk, TB_BCAST_SS},
{X86::VGETEXPPSZ256rk, X86::VGETEXPPSZ256mbk, TB_BCAST_SS},
{X86::VGETEXPPSZrk, X86::VGETEXPPSZmbk, TB_BCAST_SS},
- {X86::VGETMANTPBF16Z128rrik, X86::VGETMANTPBF16Z128rmbik, TB_BCAST_SH},
- {X86::VGETMANTPBF16Z256rrik, X86::VGETMANTPBF16Z256rmbik, TB_BCAST_SH},
- {X86::VGETMANTPBF16Zrrik, X86::VGETMANTPBF16Zrmbik, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z128rrik, X86::VGETMANTBF16Z128rmbik, TB_BCAST_SH},
+ {X86::VGETMANTBF16Z256rrik, X86::VGETMANTBF16Z256rmbik, TB_BCAST_SH},
+ {X86::VGETMANTBF16Zrrik, X86::VGETMANTBF16Zrmbik, TB_BCAST_SH},
{X86::VGETMANTPDZ128rrik, X86::VGETMANTPDZ128rmbik, TB_BCAST_SD},
{X86::VGETMANTPDZ256rrik, X86::VGETMANTPDZ256rmbik, TB_BCAST_SD},
{X86::VGETMANTPDZrrik, X86::VGETMANTPDZrmbik, TB_BCAST_SD},
@@ -9201,6 +9201,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VGF2P8AFFINEQBZ128rrikz, X86::VGF2P8AFFINEQBZ128rmbikz, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZ256rrikz, X86::VGF2P8AFFINEQBZ256rmbikz, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZrrikz, X86::VGF2P8AFFINEQBZrmbikz, TB_BCAST_Q},
+ {X86::VMAXBF16Z128rrkz, X86::VMAXBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VMAXBF16Z256rrkz, X86::VMAXBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VMAXBF16Zrrkz, X86::VMAXBF16Zrmbkz, TB_BCAST_SH},
{X86::VMAXCPDZ128rrkz, X86::VMAXCPDZ128rmbkz, TB_BCAST_SD},
{X86::VMAXCPDZ256rrkz, X86::VMAXCPDZ256rmbkz, TB_BCAST_SD},
{X86::VMAXCPDZrrkz, X86::VMAXCPDZrmbkz, TB_BCAST_SD},
@@ -9210,9 +9213,6 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VMAXCPSZ128rrkz, X86::VMAXCPSZ128rmbkz, TB_BCAST_SS},
{X86::VMAXCPSZ256rrkz, X86::VMAXCPSZ256rmbkz, TB_BCAST_SS},
{X86::VMAXCPSZrrkz, X86::VMAXCPSZrmbkz, TB_BCAST_SS},
- {X86::VMAXPBF16Z128rrkz, X86::VMAXPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VMAXPBF16Z256rrkz, X86::VMAXPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VMAXPBF16Zrrkz, X86::VMAXPBF16Zrmbkz, TB_BCAST_SH},
{X86::VMAXPDZ128rrkz, X86::VMAXPDZ128rmbkz, TB_BCAST_SD},
{X86::VMAXPDZ256rrkz, X86::VMAXPDZ256rmbkz, TB_BCAST_SD},
{X86::VMAXPDZrrkz, X86::VMAXPDZrmbkz, TB_BCAST_SD},
@@ -9222,6 +9222,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VMAXPSZ128rrkz, X86::VMAXPSZ128rmbkz, TB_BCAST_SS},
{X86::VMAXPSZ256rrkz, X86::VMAXPSZ256rmbkz, TB_BCAST_SS},
{X86::VMAXPSZrrkz, X86::VMAXPSZrmbkz, TB_BCAST_SS},
+ {X86::VMINBF16Z128rrkz, X86::VMINBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VMINBF16Z256rrkz, X86::VMINBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VMINBF16Zrrkz, X86::VMINBF16Zrmbkz, TB_BCAST_SH},
{X86::VMINCPDZ128rrkz, X86::VMINCPDZ128rmbkz, TB_BCAST_SD},
{X86::VMINCPDZ256rrkz, X86::VMINCPDZ256rmbkz, TB_BCAST_SD},
{X86::VMINCPDZrrkz, X86::VMINCPDZrmbkz, TB_BCAST_SD},
@@ -9243,9 +9246,6 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VMINMAXPSZ128rrikz, X86::VMINMAXPSZ128rmbikz, TB_BCAST_SS},
{X86::VMINMAXPSZ256rrikz, X86::VMINMAXPSZ256rmbikz, TB_BCAST_SS},
{X86::VMINMAXPSZrrikz, X86::VMINMAXPSZrmbikz, TB_BCAST_SS},
- {X86::VMINPBF16Z128rrkz, X86::VMINPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VMINPBF16Z256rrkz, X86::VMINPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VMINPBF16Zrrkz, X86::VMINPBF16Zrmbkz, TB_BCAST_SH},
{X86::VMINPDZ128rrkz, X86::VMINPDZ128rmbkz, TB_BCAST_SD},
{X86::VMINPDZ256rrkz, X86::VMINPDZ256rmbkz, TB_BCAST_SD},
{X86::VMINPDZrrkz, X86::VMINPDZrmbkz, TB_BCAST_SD},
@@ -9255,9 +9255,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VMINPSZ128rrkz, X86::VMINPSZ128rmbkz, TB_BCAST_SS},
{X86::VMINPSZ256rrkz, X86::VMINPSZ256rmbkz, TB_BCAST_SS},
{X86::VMINPSZrrkz, X86::VMINPSZrmbkz, TB_BCAST_SS},
- {X86::VMULNEPBF16Z128rrkz, X86::VMULNEPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VMULNEPBF16Z256rrkz, X86::VMULNEPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VMULNEPBF16Zrrkz, X86::VMULNEPBF16Zrmbkz, TB_BCAST_SH},
+ {X86::VMULBF16Z128rrkz, X86::VMULBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VMULBF16Z256rrkz, X86::VMULBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VMULBF16Zrrkz, X86::VMULBF16Zrmbkz, TB_BCAST_SH},
{X86::VMULPDZ128rrkz, X86::VMULPDZ128rmbkz, TB_BCAST_SD},
{X86::VMULPDZ256rrkz, X86::VMULPDZ256rmbkz, TB_BCAST_SD},
{X86::VMULPDZrrkz, X86::VMULPDZrmbkz, TB_BCAST_SD},
@@ -9641,15 +9641,15 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VRCP14PSZrk, X86::VRCP14PSZmbk, TB_BCAST_SS},
{X86::VRCP28PDZrk, X86::VRCP28PDZmbk, TB_BCAST_SD},
{X86::VRCP28PSZrk, X86::VRCP28PSZmbk, TB_BCAST_SS},
- {X86::VRCPPBF16Z128rk, X86::VRCPPBF16Z128mbk, TB_BCAST_SH},
- {X86::VRCPPBF16Z256rk, X86::VRCPPBF16Z256mbk, TB_BCAST_SH},
- {X86::VRCPPBF16Zrk, X86::VRCPPBF16Zmbk, TB_BCAST_SH},
+ {X86::VRCPBF16Z128rk, X86::VRCPBF16Z128mbk, TB_BCAST_SH},
+ {X86::VRCPBF16Z256rk, X86::VRCPBF16Z256mbk, TB_BCAST_SH},
+ {X86::VRCPBF16Zrk, X86::VRCPBF16Zmbk, TB_BCAST_SH},
{X86::VRCPPHZ128rk, X86::VRCPPHZ128mbk, TB_BCAST_SH},
{X86::VRCPPHZ256rk, X86::VRCPPHZ256mbk, TB_BCAST_SH},
{X86::VRCPPHZrk, X86::VRCPPHZmbk, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z128rrik, X86::VREDUCENEPBF16Z128rmbik, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Z256rrik, X86::VREDUCENEPBF16Z256rmbik, TB_BCAST_SH},
- {X86::VREDUCENEPBF16Zrrik, X86::VREDUCENEPBF16Zrmbik, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z128rrik, X86::VREDUCEBF16Z128rmbik, TB_BCAST_SH},
+ {X86::VREDUCEBF16Z256rrik, X86::VREDUCEBF16Z256rmbik, TB_BCAST_SH},
+ {X86::VREDUCEBF16Zrrik, X86::VREDUCEBF16Zrmbik, TB_BCAST_SH},
{X86::VREDUCEPDZ128rrik, X86::VREDUCEPDZ128rmbik, TB_BCAST_SD},
{X86::VREDUCEPDZ256rrik, X86::VREDUCEPDZ256rmbik, TB_BCAST_SD},
{X86::VREDUCEPDZrrik, X86::VREDUCEPDZrmbik, TB_BCAST_SD},
@@ -9659,9 +9659,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VREDUCEPSZ128rrik, X86::VREDUCEPSZ128rmbik, TB_BCAST_SS},
{X86::VREDUCEPSZ256rrik, X86::VREDUCEPSZ256rmbik, TB_BCAST_SS},
{X86::VREDUCEPSZrrik, X86::VREDUCEPSZrmbik, TB_BCAST_SS},
- {X86::VRNDSCALENEPBF16Z128rrik, X86::VRNDSCALENEPBF16Z128rmbik, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Z256rrik, X86::VRNDSCALENEPBF16Z256rmbik, TB_BCAST_SH},
- {X86::VRNDSCALENEPBF16Zrrik, X86::VRNDSCALENEPBF16Zrmbik, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z128rrik, X86::VRNDSCALEBF16Z128rmbik, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Z256rrik, X86::VRNDSCALEBF16Z256rmbik, TB_BCAST_SH},
+ {X86::VRNDSCALEBF16Zrrik, X86::VRNDSCALEBF16Zrmbik, TB_BCAST_SH},
{X86::VRNDSCALEPDZ128rrik, X86::VRNDSCALEPDZ128rmbik, TB_BCAST_SD},
{X86::VRNDSCALEPDZ256rrik, X86::VRNDSCALEPDZ256rmbik, TB_BCAST_SD},
{X86::VRNDSCALEPDZrrik, X86::VRNDSCALEPDZrmbik, TB_BCAST_SD},
@@ -9679,15 +9679,15 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VRSQRT14PSZrk, X86::VRSQRT14PSZmbk, TB_BCAST_SS},
{X86::VRSQRT28PDZrk, X86::VRSQRT28PDZmbk, TB_BCAST_SD},
{X86::VRSQRT28PSZrk, X86::VRSQRT28PSZmbk, TB_BCAST_SS},
- {X86::VRSQRTPBF16Z128rk, X86::VRSQRTPBF16Z128mbk, TB_BCAST_SH},
- {X86::VRSQRTPBF16Z256rk, X86::VRSQRTPBF16Z256mbk, TB_BCAST_SH},
- {X86::VRSQRTPBF16Zrk, X86::VRSQRTPBF16Zmbk, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z128rk, X86::VRSQRTBF16Z128mbk, TB_BCAST_SH},
+ {X86::VRSQRTBF16Z256rk, X86::VRSQRTBF16Z256mbk, TB_BCAST_SH},
+ {X86::VRSQRTBF16Zrk, X86::VRSQRTBF16Zmbk, TB_BCAST_SH},
{X86::VRSQRTPHZ128rk, X86::VRSQRTPHZ128mbk, TB_BCAST_SH},
{X86::VRSQRTPHZ256rk, X86::VRSQRTPHZ256mbk, TB_BCAST_SH},
{X86::VRSQRTPHZrk, X86::VRSQRTPHZmbk, TB_BCAST_SH},
- {X86::VSCALEFPBF16Z128rrkz, X86::VSCALEFPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VSCALEFPBF16Z256rrkz, X86::VSCALEFPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VSCALEFPBF16Zrrkz, X86::VSCALEFPBF16Zrmbkz, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z128rrkz, X86::VSCALEFBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z256rrkz, X86::VSCALEFBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VSCALEFBF16Zrrkz, X86::VSCALEFBF16Zrmbkz, TB_BCAST_SH},
{X86::VSCALEFPDZ128rrkz, X86::VSCALEFPDZ128rmbkz, TB_BCAST_SD},
{X86::VSCALEFPDZ256rrkz, X86::VSCALEFPDZ256rmbkz, TB_BCAST_SD},
{X86::VSCALEFPDZrrkz, X86::VSCALEFPDZrmbkz, TB_BCAST_SD},
@@ -9711,9 +9711,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VSHUFPSZ128rrikz, X86::VSHUFPSZ128rmbikz, TB_BCAST_SS},
{X86::VSHUFPSZ256rrikz, X86::VSHUFPSZ256rmbikz, TB_BCAST_SS},
{X86::VSHUFPSZrrikz, X86::VSHUFPSZrmbikz, TB_BCAST_SS},
- {X86::VSQRTNEPBF16Z128rk, X86::VSQRTNEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Z256rk, X86::VSQRTNEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VSQRTNEPBF16Zrk, X86::VSQRTNEPBF16Zmbk, TB_BCAST_SH},
+ {X86::VSQRTBF16Z128rk, X86::VSQRTBF16Z128mbk, TB_BCAST_SH},
+ {X86::VSQRTBF16Z256rk, X86::VSQRTBF16Z256mbk, TB_BCAST_SH},
+ {X86::VSQRTBF16Zrk, X86::VSQRTBF16Zmbk, TB_BCAST_SH},
{X86::VSQRTPDZ128rk, X86::VSQRTPDZ128mbk, TB_BCAST_SD},
{X86::VSQRTPDZ256rk, X86::VSQRTPDZ256mbk, TB_BCAST_SD},
{X86::VSQRTPDZrk, X86::VSQRTPDZmbk, TB_BCAST_SD},
@@ -9723,9 +9723,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
{X86::VSQRTPSZ128rk, X86::VSQRTPSZ128mbk, TB_BCAST_SS},
{X86::VSQRTPSZ256rk, X86::VSQRTPSZ256mbk, TB_BCAST_SS},
{X86::VSQRTPSZrk, X86::VSQRTPSZmbk, TB_BCAST_SS},
- {X86::VSUBNEPBF16Z128rrkz, X86::VSUBNEPBF16Z128rmbkz, TB_BCAST_SH},
- {X86::VSUBNEPBF16Z256rrkz, X86::VSUBNEPBF16Z256rmbkz, TB_BCAST_SH},
- {X86::VSUBNEPBF16Zrrkz, X86::VSUBNEPBF16Zrmbkz, TB_BCAST_SH},
+ {X86::VSUBBF16Z128rrkz, X86::VSUBBF16Z128rmbkz, TB_BCAST_SH},
+ {X86::VSUBBF16Z256rrkz, X86::VSUBBF16Z256rmbkz, TB_BCAST_SH},
+ {X86::VSUBBF16Zrrkz, X86::VSUBBF16Zrmbkz, TB_BCAST_SH},
{X86::VSUBPDZ128rrkz, X86::VSUBPDZ128rmbkz, TB_BCAST_SD},
{X86::VSUBPDZ256rrkz, X86::VSUBPDZ256rmbkz, TB_BCAST_SD},
{X86::VSUBPDZrrkz, X86::VSUBPDZrmbkz, TB_BCAST_SD},
@@ -9756,9 +9756,9 @@ static const X86FoldTableEntry BroadcastTable3[] = {
};
static const X86FoldTableEntry BroadcastTable4[] = {
- {X86::VADDNEPBF16Z128rrk, X86::VADDNEPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VADDNEPBF16Z256rrk, X86::VADDNEPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VADDNEPBF16Zrrk, X86::VADDNEPBF16Zrmbk, TB_BCAST_SH},
+ {X86::VADDBF16Z128rrk, X86::VADDBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VADDBF16Z256rrk, X86::VADDBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VADDBF16Zrrk, X86::VADDBF16Zrmbk, TB_BCAST_SH},
{X86::VADDPDZ128rrk, X86::VADDPDZ128rmbk, TB_BCAST_SD},
{X86::VADDPDZ256rrk, X86::VADDPDZ256rmbk, TB_BCAST_SD},
{X86::VADDPDZrrk, X86::VADDPDZrmbk, TB_BCAST_SD},
@@ -9816,9 +9816,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VCVTNE2PS2BF16Z128rrk, X86::VCVTNE2PS2BF16Z128rmbk, TB_BCAST_SS},
{X86::VCVTNE2PS2BF16Z256rrk, X86::VCVTNE2PS2BF16Z256rmbk, TB_BCAST_SS},
{X86::VCVTNE2PS2BF16Zrrk, X86::VCVTNE2PS2BF16Zrmbk, TB_BCAST_SS},
- {X86::VDIVNEPBF16Z128rrk, X86::VDIVNEPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VDIVNEPBF16Z256rrk, X86::VDIVNEPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VDIVNEPBF16Zrrk, X86::VDIVNEPBF16Zrmbk, TB_BCAST_SH},
+ {X86::VDIVBF16Z128rrk, X86::VDIVBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VDIVBF16Z256rrk, X86::VDIVBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VDIVBF16Zrrk, X86::VDIVBF16Zrmbk, TB_BCAST_SH},
{X86::VDIVPDZ128rrk, X86::VDIVPDZ128rmbk, TB_BCAST_SD},
{X86::VDIVPDZ256rrk, X86::VDIVPDZ256rmbk, TB_BCAST_SD},
{X86::VDIVPDZrrk, X86::VDIVPDZrmbk, TB_BCAST_SD},
@@ -9861,12 +9861,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFIXUPIMMPSZ256rrikz, X86::VFIXUPIMMPSZ256rmbikz, TB_BCAST_SS},
{X86::VFIXUPIMMPSZrrik, X86::VFIXUPIMMPSZrmbik, TB_BCAST_SS},
{X86::VFIXUPIMMPSZrrikz, X86::VFIXUPIMMPSZrmbikz, TB_BCAST_SS},
- {X86::VFMADD132NEPBF16Z128rk, X86::VFMADD132NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Z128rkz, X86::VFMADD132NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Z256rk, X86::VFMADD132NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Z256rkz, X86::VFMADD132NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Zrk, X86::VFMADD132NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMADD132NEPBF16Zrkz, X86::VFMADD132NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z128rk, X86::VFMADD132BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z128rkz, X86::VFMADD132BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z256rk, X86::VFMADD132BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMADD132BF16Z256rkz, X86::VFMADD132BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMADD132BF16Zrk, X86::VFMADD132BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMADD132BF16Zrkz, X86::VFMADD132BF16Zmbkz, TB_BCAST_SH},
{X86::VFMADD132PDZ128rk, X86::VFMADD132PDZ128mbk, TB_BCAST_SD},
{X86::VFMADD132PDZ128rkz, X86::VFMADD132PDZ128mbkz, TB_BCAST_SD},
{X86::VFMADD132PDZ256rk, X86::VFMADD132PDZ256mbk, TB_BCAST_SD},
@@ -9885,12 +9885,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMADD132PSZ256rkz, X86::VFMADD132PSZ256mbkz, TB_BCAST_SS},
{X86::VFMADD132PSZrk, X86::VFMADD132PSZmbk, TB_BCAST_SS},
{X86::VFMADD132PSZrkz, X86::VFMADD132PSZmbkz, TB_BCAST_SS},
- {X86::VFMADD213NEPBF16Z128rk, X86::VFMADD213NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Z128rkz, X86::VFMADD213NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Z256rk, X86::VFMADD213NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Z256rkz, X86::VFMADD213NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Zrk, X86::VFMADD213NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMADD213NEPBF16Zrkz, X86::VFMADD213NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z128rk, X86::VFMADD213BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z128rkz, X86::VFMADD213BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z256rk, X86::VFMADD213BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMADD213BF16Z256rkz, X86::VFMADD213BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMADD213BF16Zrk, X86::VFMADD213BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMADD213BF16Zrkz, X86::VFMADD213BF16Zmbkz, TB_BCAST_SH},
{X86::VFMADD213PDZ128rk, X86::VFMADD213PDZ128mbk, TB_BCAST_SD},
{X86::VFMADD213PDZ128rkz, X86::VFMADD213PDZ128mbkz, TB_BCAST_SD},
{X86::VFMADD213PDZ256rk, X86::VFMADD213PDZ256mbk, TB_BCAST_SD},
@@ -9909,12 +9909,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMADD213PSZ256rkz, X86::VFMADD213PSZ256mbkz, TB_BCAST_SS},
{X86::VFMADD213PSZrk, X86::VFMADD213PSZmbk, TB_BCAST_SS},
{X86::VFMADD213PSZrkz, X86::VFMADD213PSZmbkz, TB_BCAST_SS},
- {X86::VFMADD231NEPBF16Z128rk, X86::VFMADD231NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Z128rkz, X86::VFMADD231NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Z256rk, X86::VFMADD231NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Z256rkz, X86::VFMADD231NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Zrk, X86::VFMADD231NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMADD231NEPBF16Zrkz, X86::VFMADD231NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z128rk, X86::VFMADD231BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z128rkz, X86::VFMADD231BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z256rk, X86::VFMADD231BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMADD231BF16Z256rkz, X86::VFMADD231BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMADD231BF16Zrk, X86::VFMADD231BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMADD231BF16Zrkz, X86::VFMADD231BF16Zmbkz, TB_BCAST_SH},
{X86::VFMADD231PDZ128rk, X86::VFMADD231PDZ128mbk, TB_BCAST_SD},
{X86::VFMADD231PDZ128rkz, X86::VFMADD231PDZ128mbkz, TB_BCAST_SD},
{X86::VFMADD231PDZ256rk, X86::VFMADD231PDZ256mbk, TB_BCAST_SD},
@@ -9993,12 +9993,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMADDSUB231PSZ256rkz, X86::VFMADDSUB231PSZ256mbkz, TB_BCAST_SS},
{X86::VFMADDSUB231PSZrk, X86::VFMADDSUB231PSZmbk, TB_BCAST_SS},
{X86::VFMADDSUB231PSZrkz, X86::VFMADDSUB231PSZmbkz, TB_BCAST_SS},
- {X86::VFMSUB132NEPBF16Z128rk, X86::VFMSUB132NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Z128rkz, X86::VFMSUB132NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Z256rk, X86::VFMSUB132NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Z256rkz, X86::VFMSUB132NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Zrk, X86::VFMSUB132NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMSUB132NEPBF16Zrkz, X86::VFMSUB132NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z128rk, X86::VFMSUB132BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z128rkz, X86::VFMSUB132BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z256rk, X86::VFMSUB132BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Z256rkz, X86::VFMSUB132BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Zrk, X86::VFMSUB132BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMSUB132BF16Zrkz, X86::VFMSUB132BF16Zmbkz, TB_BCAST_SH},
{X86::VFMSUB132PDZ128rk, X86::VFMSUB132PDZ128mbk, TB_BCAST_SD},
{X86::VFMSUB132PDZ128rkz, X86::VFMSUB132PDZ128mbkz, TB_BCAST_SD},
{X86::VFMSUB132PDZ256rk, X86::VFMSUB132PDZ256mbk, TB_BCAST_SD},
@@ -10017,12 +10017,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMSUB132PSZ256rkz, X86::VFMSUB132PSZ256mbkz, TB_BCAST_SS},
{X86::VFMSUB132PSZrk, X86::VFMSUB132PSZmbk, TB_BCAST_SS},
{X86::VFMSUB132PSZrkz, X86::VFMSUB132PSZmbkz, TB_BCAST_SS},
- {X86::VFMSUB213NEPBF16Z128rk, X86::VFMSUB213NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Z128rkz, X86::VFMSUB213NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Z256rk, X86::VFMSUB213NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Z256rkz, X86::VFMSUB213NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Zrk, X86::VFMSUB213NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMSUB213NEPBF16Zrkz, X86::VFMSUB213NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z128rk, X86::VFMSUB213BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z128rkz, X86::VFMSUB213BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z256rk, X86::VFMSUB213BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Z256rkz, X86::VFMSUB213BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Zrk, X86::VFMSUB213BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMSUB213BF16Zrkz, X86::VFMSUB213BF16Zmbkz, TB_BCAST_SH},
{X86::VFMSUB213PDZ128rk, X86::VFMSUB213PDZ128mbk, TB_BCAST_SD},
{X86::VFMSUB213PDZ128rkz, X86::VFMSUB213PDZ128mbkz, TB_BCAST_SD},
{X86::VFMSUB213PDZ256rk, X86::VFMSUB213PDZ256mbk, TB_BCAST_SD},
@@ -10041,12 +10041,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMSUB213PSZ256rkz, X86::VFMSUB213PSZ256mbkz, TB_BCAST_SS},
{X86::VFMSUB213PSZrk, X86::VFMSUB213PSZmbk, TB_BCAST_SS},
{X86::VFMSUB213PSZrkz, X86::VFMSUB213PSZmbkz, TB_BCAST_SS},
- {X86::VFMSUB231NEPBF16Z128rk, X86::VFMSUB231NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Z128rkz, X86::VFMSUB231NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Z256rk, X86::VFMSUB231NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Z256rkz, X86::VFMSUB231NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Zrk, X86::VFMSUB231NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFMSUB231NEPBF16Zrkz, X86::VFMSUB231NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z128rk, X86::VFMSUB231BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z128rkz, X86::VFMSUB231BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z256rk, X86::VFMSUB231BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Z256rkz, X86::VFMSUB231BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Zrk, X86::VFMSUB231BF16Zmbk, TB_BCAST_SH},
+ {X86::VFMSUB231BF16Zrkz, X86::VFMSUB231BF16Zmbkz, TB_BCAST_SH},
{X86::VFMSUB231PDZ128rk, X86::VFMSUB231PDZ128mbk, TB_BCAST_SD},
{X86::VFMSUB231PDZ128rkz, X86::VFMSUB231PDZ128mbkz, TB_BCAST_SD},
{X86::VFMSUB231PDZ256rk, X86::VFMSUB231PDZ256mbk, TB_BCAST_SD},
@@ -10122,12 +10122,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFMULCPHZ128rrk, X86::VFMULCPHZ128rmbk, TB_BCAST_SS},
{X86::VFMULCPHZ256rrk, X86::VFMULCPHZ256rmbk, TB_BCAST_SS},
{X86::VFMULCPHZrrk, X86::VFMULCPHZrmbk, TB_BCAST_SS},
- {X86::VFNMADD132NEPBF16Z128rk, X86::VFNMADD132NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Z128rkz, X86::VFNMADD132NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Z256rk, X86::VFNMADD132NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Z256rkz, X86::VFNMADD132NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Zrk, X86::VFNMADD132NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMADD132NEPBF16Zrkz, X86::VFNMADD132NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z128rk, X86::VFNMADD132BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z128rkz, X86::VFNMADD132BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z256rk, X86::VFNMADD132BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Z256rkz, X86::VFNMADD132BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Zrk, X86::VFNMADD132BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMADD132BF16Zrkz, X86::VFNMADD132BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMADD132PDZ128rk, X86::VFNMADD132PDZ128mbk, TB_BCAST_SD},
{X86::VFNMADD132PDZ128rkz, X86::VFNMADD132PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMADD132PDZ256rk, X86::VFNMADD132PDZ256mbk, TB_BCAST_SD},
@@ -10146,12 +10146,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFNMADD132PSZ256rkz, X86::VFNMADD132PSZ256mbkz, TB_BCAST_SS},
{X86::VFNMADD132PSZrk, X86::VFNMADD132PSZmbk, TB_BCAST_SS},
{X86::VFNMADD132PSZrkz, X86::VFNMADD132PSZmbkz, TB_BCAST_SS},
- {X86::VFNMADD213NEPBF16Z128rk, X86::VFNMADD213NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Z128rkz, X86::VFNMADD213NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Z256rk, X86::VFNMADD213NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Z256rkz, X86::VFNMADD213NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Zrk, X86::VFNMADD213NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMADD213NEPBF16Zrkz, X86::VFNMADD213NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z128rk, X86::VFNMADD213BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z128rkz, X86::VFNMADD213BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z256rk, X86::VFNMADD213BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Z256rkz, X86::VFNMADD213BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Zrk, X86::VFNMADD213BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMADD213BF16Zrkz, X86::VFNMADD213BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMADD213PDZ128rk, X86::VFNMADD213PDZ128mbk, TB_BCAST_SD},
{X86::VFNMADD213PDZ128rkz, X86::VFNMADD213PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMADD213PDZ256rk, X86::VFNMADD213PDZ256mbk, TB_BCAST_SD},
@@ -10170,12 +10170,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFNMADD213PSZ256rkz, X86::VFNMADD213PSZ256mbkz, TB_BCAST_SS},
{X86::VFNMADD213PSZrk, X86::VFNMADD213PSZmbk, TB_BCAST_SS},
{X86::VFNMADD213PSZrkz, X86::VFNMADD213PSZmbkz, TB_BCAST_SS},
- {X86::VFNMADD231NEPBF16Z128rk, X86::VFNMADD231NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Z128rkz, X86::VFNMADD231NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Z256rk, X86::VFNMADD231NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Z256rkz, X86::VFNMADD231NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Zrk, X86::VFNMADD231NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMADD231NEPBF16Zrkz, X86::VFNMADD231NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z128rk, X86::VFNMADD231BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z128rkz, X86::VFNMADD231BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z256rk, X86::VFNMADD231BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Z256rkz, X86::VFNMADD231BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Zrk, X86::VFNMADD231BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMADD231BF16Zrkz, X86::VFNMADD231BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMADD231PDZ128rk, X86::VFNMADD231PDZ128mbk, TB_BCAST_SD},
{X86::VFNMADD231PDZ128rkz, X86::VFNMADD231PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMADD231PDZ256rk, X86::VFNMADD231PDZ256mbk, TB_BCAST_SD},
@@ -10194,12 +10194,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFNMADD231PSZ256rkz, X86::VFNMADD231PSZ256mbkz, TB_BCAST_SS},
{X86::VFNMADD231PSZrk, X86::VFNMADD231PSZmbk, TB_BCAST_SS},
{X86::VFNMADD231PSZrkz, X86::VFNMADD231PSZmbkz, TB_BCAST_SS},
- {X86::VFNMSUB132NEPBF16Z128rk, X86::VFNMSUB132NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Z128rkz, X86::VFNMSUB132NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Z256rk, X86::VFNMSUB132NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Z256rkz, X86::VFNMSUB132NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Zrk, X86::VFNMSUB132NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMSUB132NEPBF16Zrkz, X86::VFNMSUB132NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z128rk, X86::VFNMSUB132BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z128rkz, X86::VFNMSUB132BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z256rk, X86::VFNMSUB132BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Z256rkz, X86::VFNMSUB132BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Zrk, X86::VFNMSUB132BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMSUB132BF16Zrkz, X86::VFNMSUB132BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMSUB132PDZ128rk, X86::VFNMSUB132PDZ128mbk, TB_BCAST_SD},
{X86::VFNMSUB132PDZ128rkz, X86::VFNMSUB132PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMSUB132PDZ256rk, X86::VFNMSUB132PDZ256mbk, TB_BCAST_SD},
@@ -10218,12 +10218,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFNMSUB132PSZ256rkz, X86::VFNMSUB132PSZ256mbkz, TB_BCAST_SS},
{X86::VFNMSUB132PSZrk, X86::VFNMSUB132PSZmbk, TB_BCAST_SS},
{X86::VFNMSUB132PSZrkz, X86::VFNMSUB132PSZmbkz, TB_BCAST_SS},
- {X86::VFNMSUB213NEPBF16Z128rk, X86::VFNMSUB213NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Z128rkz, X86::VFNMSUB213NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Z256rk, X86::VFNMSUB213NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Z256rkz, X86::VFNMSUB213NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Zrk, X86::VFNMSUB213NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMSUB213NEPBF16Zrkz, X86::VFNMSUB213NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z128rk, X86::VFNMSUB213BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z128rkz, X86::VFNMSUB213BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z256rk, X86::VFNMSUB213BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Z256rkz, X86::VFNMSUB213BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Zrk, X86::VFNMSUB213BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMSUB213BF16Zrkz, X86::VFNMSUB213BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMSUB213PDZ128rk, X86::VFNMSUB213PDZ128mbk, TB_BCAST_SD},
{X86::VFNMSUB213PDZ128rkz, X86::VFNMSUB213PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMSUB213PDZ256rk, X86::VFNMSUB213PDZ256mbk, TB_BCAST_SD},
@@ -10242,12 +10242,12 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VFNMSUB213PSZ256rkz, X86::VFNMSUB213PSZ256mbkz, TB_BCAST_SS},
{X86::VFNMSUB213PSZrk, X86::VFNMSUB213PSZmbk, TB_BCAST_SS},
{X86::VFNMSUB213PSZrkz, X86::VFNMSUB213PSZmbkz, TB_BCAST_SS},
- {X86::VFNMSUB231NEPBF16Z128rk, X86::VFNMSUB231NEPBF16Z128mbk, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Z128rkz, X86::VFNMSUB231NEPBF16Z128mbkz, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Z256rk, X86::VFNMSUB231NEPBF16Z256mbk, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Z256rkz, X86::VFNMSUB231NEPBF16Z256mbkz, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Zrk, X86::VFNMSUB231NEPBF16Zmbk, TB_BCAST_SH},
- {X86::VFNMSUB231NEPBF16Zrkz, X86::VFNMSUB231NEPBF16Zmbkz, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z128rk, X86::VFNMSUB231BF16Z128mbk, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z128rkz, X86::VFNMSUB231BF16Z128mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z256rk, X86::VFNMSUB231BF16Z256mbk, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Z256rkz, X86::VFNMSUB231BF16Z256mbkz, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Zrk, X86::VFNMSUB231BF16Zmbk, TB_BCAST_SH},
+ {X86::VFNMSUB231BF16Zrkz, X86::VFNMSUB231BF16Zmbkz, TB_BCAST_SH},
{X86::VFNMSUB231PDZ128rk, X86::VFNMSUB231PDZ128mbk, TB_BCAST_SD},
{X86::VFNMSUB231PDZ128rkz, X86::VFNMSUB231PDZ128mbkz, TB_BCAST_SD},
{X86::VFNMSUB231PDZ256rk, X86::VFNMSUB231PDZ256mbk, TB_BCAST_SD},
@@ -10272,6 +10272,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VGF2P8AFFINEQBZ128rrik, X86::VGF2P8AFFINEQBZ128rmbik, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZ256rrik, X86::VGF2P8AFFINEQBZ256rmbik, TB_BCAST_Q},
{X86::VGF2P8AFFINEQBZrrik, X86::VGF2P8AFFINEQBZrmbik, TB_BCAST_Q},
+ {X86::VMAXBF16Z128rrk, X86::VMAXBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VMAXBF16Z256rrk, X86::VMAXBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VMAXBF16Zrrk, X86::VMAXBF16Zrmbk, TB_BCAST_SH},
{X86::VMAXCPDZ128rrk, X86::VMAXCPDZ128rmbk, TB_BCAST_SD},
{X86::VMAXCPDZ256rrk, X86::VMAXCPDZ256rmbk, TB_BCAST_SD},
{X86::VMAXCPDZrrk, X86::VMAXCPDZrmbk, TB_BCAST_SD},
@@ -10281,9 +10284,6 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VMAXCPSZ128rrk, X86::VMAXCPSZ128rmbk, TB_BCAST_SS},
{X86::VMAXCPSZ256rrk, X86::VMAXCPSZ256rmbk, TB_BCAST_SS},
{X86::VMAXCPSZrrk, X86::VMAXCPSZrmbk, TB_BCAST_SS},
- {X86::VMAXPBF16Z128rrk, X86::VMAXPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VMAXPBF16Z256rrk, X86::VMAXPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VMAXPBF16Zrrk, X86::VMAXPBF16Zrmbk, TB_BCAST_SH},
{X86::VMAXPDZ128rrk, X86::VMAXPDZ128rmbk, TB_BCAST_SD},
{X86::VMAXPDZ256rrk, X86::VMAXPDZ256rmbk, TB_BCAST_SD},
{X86::VMAXPDZrrk, X86::VMAXPDZrmbk, TB_BCAST_SD},
@@ -10293,6 +10293,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VMAXPSZ128rrk, X86::VMAXPSZ128rmbk, TB_BCAST_SS},
{X86::VMAXPSZ256rrk, X86::VMAXPSZ256rmbk, TB_BCAST_SS},
{X86::VMAXPSZrrk, X86::VMAXPSZrmbk, TB_BCAST_SS},
+ {X86::VMINBF16Z128rrk, X86::VMINBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VMINBF16Z256rrk, X86::VMINBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VMINBF16Zrrk, X86::VMINBF16Zrmbk, TB_BCAST_SH},
{X86::VMINCPDZ128rrk, X86::VMINCPDZ128rmbk, TB_BCAST_SD},
{X86::VMINCPDZ256rrk, X86::VMINCPDZ256rmbk, TB_BCAST_SD},
{X86::VMINCPDZrrk, X86::VMINCPDZrmbk, TB_BCAST_SD},
@@ -10314,9 +10317,6 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VMINMAXPSZ128rrik, X86::VMINMAXPSZ128rmbik, TB_BCAST_SS},
{X86::VMINMAXPSZ256rrik, X86::VMINMAXPSZ256rmbik, TB_BCAST_SS},
{X86::VMINMAXPSZrrik, X86::VMINMAXPSZrmbik, TB_BCAST_SS},
- {X86::VMINPBF16Z128rrk, X86::VMINPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VMINPBF16Z256rrk, X86::VMINPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VMINPBF16Zrrk, X86::VMINPBF16Zrmbk, TB_BCAST_SH},
{X86::VMINPDZ128rrk, X86::VMINPDZ128rmbk, TB_BCAST_SD},
{X86::VMINPDZ256rrk, X86::VMINPDZ256rmbk, TB_BCAST_SD},
{X86::VMINPDZrrk, X86::VMINPDZrmbk, TB_BCAST_SD},
@@ -10326,9 +10326,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VMINPSZ128rrk, X86::VMINPSZ128rmbk, TB_BCAST_SS},
{X86::VMINPSZ256rrk, X86::VMINPSZ256rmbk, TB_BCAST_SS},
{X86::VMINPSZrrk, X86::VMINPSZrmbk, TB_BCAST_SS},
- {X86::VMULNEPBF16Z128rrk, X86::VMULNEPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VMULNEPBF16Z256rrk, X86::VMULNEPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VMULNEPBF16Zrrk, X86::VMULNEPBF16Zrmbk, TB_BCAST_SH},
+ {X86::VMULBF16Z128rrk, X86::VMULBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VMULBF16Z256rrk, X86::VMULBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VMULBF16Zrrk, X86::VMULBF16Zrmbk, TB_BCAST_SH},
{X86::VMULPDZ128rrk, X86::VMULPDZ128rmbk, TB_BCAST_SD},
{X86::VMULPDZ256rrk, X86::VMULPDZ256rmbk, TB_BCAST_SD},
{X86::VMULPDZrrk, X86::VMULPDZrmbk, TB_BCAST_SD},
@@ -10691,9 +10691,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VRANGEPSZ128rrik, X86::VRANGEPSZ128rmbik, TB_BCAST_SS},
{X86::VRANGEPSZ256rrik, X86::VRANGEPSZ256rmbik, TB_BCAST_SS},
{X86::VRANGEPSZrrik, X86::VRANGEPSZrmbik, TB_BCAST_SS},
- {X86::VSCALEFPBF16Z128rrk, X86::VSCALEFPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VSCALEFPBF16Z256rrk, X86::VSCALEFPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VSCALEFPBF16Zrrk, X86::VSCALEFPBF16Zrmbk, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z128rrk, X86::VSCALEFBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VSCALEFBF16Z256rrk, X86::VSCALEFBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VSCALEFBF16Zrrk, X86::VSCALEFBF16Zrmbk, TB_BCAST_SH},
{X86::VSCALEFPDZ128rrk, X86::VSCALEFPDZ128rmbk, TB_BCAST_SD},
{X86::VSCALEFPDZ256rrk, X86::VSCALEFPDZ256rmbk, TB_BCAST_SD},
{X86::VSCALEFPDZrrk, X86::VSCALEFPDZrmbk, TB_BCAST_SD},
@@ -10717,9 +10717,9 @@ static const X86FoldTableEntry BroadcastTable4[] = {
{X86::VSHUFPSZ128rrik, X86::VSHUFPSZ128rmbik, TB_BCAST_SS},
{X86::VSHUFPSZ256rrik, X86::VSHUFPSZ256rmbik, TB_BCAST_SS},
{X86::VSHUFPSZrrik, X86::VSHUFPSZrmbik, TB_BCAST_SS},
- {X86::VSUBNEPBF16Z128rrk, X86::VSUBNEPBF16Z128rmbk, TB_BCAST_SH},
- {X86::VSUBNEPBF16Z256rrk, X86::VSUBNEPBF16Z256rmbk, TB_BCAST_SH},
- {X86::VSUBNEPBF16Zrrk, X86::VSUBNEPBF16Zrmbk, TB_BCAST_SH},
+ {X86::VSUBBF16Z128rrk, X86::VSUBBF16Z128rmbk, TB_BCAST_SH},
+ {X86::VSUBBF16Z256rrk, X86::VSUBBF16Z256rmbk, TB_BCAST_SH},
+ {X86::VSUBBF16Zrrk, X86::VSUBBF16Zrmbk, TB_BCAST_SH},
{X86::VSUBPDZ128rrk, X86::VSUBPDZ128rmbk, TB_BCAST_SD},
{X86::VSUBPDZ256rrk, X86::VSUBPDZ256rmbk, TB_BCAST_SD},
{X86::VSUBPDZrrk, X86::VSUBPDZrmbk, TB_BCAST_SD},
More information about the llvm-commits
mailing list