[llvm] 70e2d63 - [AMDGPU] Consistently use v2i16 for packed bf16 inputs. NFC.
Jay Foad via llvm-commits
llvm-commits at lists.llvm.org
Wed Mar 29 12:33:38 PDT 2023
Author: Jay Foad
Date: 2023-03-29T20:23:36+01:00
New Revision: 70e2d631e178fbf5cfcd45d8af43bfcad24db744
URL: https://github.com/llvm/llvm-project/commit/70e2d631e178fbf5cfcd45d8af43bfcad24db744
DIFF: https://github.com/llvm/llvm-project/commit/70e2d631e178fbf5cfcd45d8af43bfcad24db744.diff
LOG: [AMDGPU] Consistently use v2i16 for packed bf16 inputs. NFC.
Differential Revision: https://reviews.llvm.org/D147145
Added:
Modified:
llvm/lib/Target/AMDGPU/FLATInstructions.td
Removed:
################################################################################
diff --git a/llvm/lib/Target/AMDGPU/FLATInstructions.td b/llvm/lib/Target/AMDGPU/FLATInstructions.td
index 2782fac6a8fe7..5c86d80e7dd2b 100644
--- a/llvm/lib/Target/AMDGPU/FLATInstructions.td
+++ b/llvm/lib/Target/AMDGPU/FLATInstructions.td
@@ -732,11 +732,12 @@ let SubtargetPredicate = isGFX90APlus in {
let SubtargetPredicate = HasAtomicFlatPkAdd16Insts in {
defm FLAT_ATOMIC_PK_ADD_F16 : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_f16", VGPR_32, v2f16>;
- defm FLAT_ATOMIC_PK_ADD_BF16 : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_bf16", VGPR_32, v2f16>;
+ let FPAtomic = 1 in
+ defm FLAT_ATOMIC_PK_ADD_BF16 : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_bf16", VGPR_32, v2i16>;
} // End SubtargetPredicate = HasAtomicFlatPkAdd16Insts
-let SubtargetPredicate = HasAtomicGlobalPkAddBF16Inst in
- defm GLOBAL_ATOMIC_PK_ADD_BF16 : FLAT_Global_Atomic_Pseudo<"global_atomic_pk_add_bf16", VGPR_32, v2f16>;
+let SubtargetPredicate = HasAtomicGlobalPkAddBF16Inst, FPAtomic = 1 in
+ defm GLOBAL_ATOMIC_PK_ADD_BF16 : FLAT_Global_Atomic_Pseudo<"global_atomic_pk_add_bf16", VGPR_32, v2i16>;
// GFX7-, GFX10-, GFX11-only flat instructions.
let SubtargetPredicate = isGFX7GFX10GFX11 in {
More information about the llvm-commits mailing list