[llvm] 70e2d63 - [AMDGPU] Consistently use v2i16 for packed bf16 inputs. NFC.

Jay Foad via llvm-commits llvm-commits at lists.llvm.org
Wed Mar 29 12:33:38 PDT 2023


Author: Jay Foad
Date: 2023-03-29T20:23:36+01:00
New Revision: 70e2d631e178fbf5cfcd45d8af43bfcad24db744

URL: https://github.com/llvm/llvm-project/commit/70e2d631e178fbf5cfcd45d8af43bfcad24db744
DIFF: https://github.com/llvm/llvm-project/commit/70e2d631e178fbf5cfcd45d8af43bfcad24db744.diff

LOG: [AMDGPU] Consistently use v2i16 for packed bf16 inputs. NFC.

Differential Revision: https://reviews.llvm.org/D147145

Added: 
    

Modified: 
    llvm/lib/Target/AMDGPU/FLATInstructions.td

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/AMDGPU/FLATInstructions.td b/llvm/lib/Target/AMDGPU/FLATInstructions.td
index 2782fac6a8fe7..5c86d80e7dd2b 100644
--- a/llvm/lib/Target/AMDGPU/FLATInstructions.td
+++ b/llvm/lib/Target/AMDGPU/FLATInstructions.td
@@ -732,11 +732,12 @@ let SubtargetPredicate = isGFX90APlus in {
 
 let SubtargetPredicate = HasAtomicFlatPkAdd16Insts in {
   defm FLAT_ATOMIC_PK_ADD_F16    : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_f16",  VGPR_32, v2f16>;
-  defm FLAT_ATOMIC_PK_ADD_BF16   : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_bf16", VGPR_32, v2f16>;
+  let FPAtomic = 1 in
+    defm FLAT_ATOMIC_PK_ADD_BF16   : FLAT_Atomic_Pseudo<"flat_atomic_pk_add_bf16", VGPR_32, v2i16>;
 } // End SubtargetPredicate = HasAtomicFlatPkAdd16Insts
 
-let SubtargetPredicate = HasAtomicGlobalPkAddBF16Inst in
-  defm GLOBAL_ATOMIC_PK_ADD_BF16 : FLAT_Global_Atomic_Pseudo<"global_atomic_pk_add_bf16", VGPR_32, v2f16>;
+let SubtargetPredicate = HasAtomicGlobalPkAddBF16Inst, FPAtomic = 1 in
+  defm GLOBAL_ATOMIC_PK_ADD_BF16 : FLAT_Global_Atomic_Pseudo<"global_atomic_pk_add_bf16", VGPR_32, v2i16>;
 
 // GFX7-, GFX10-, GFX11-only flat instructions.
 let SubtargetPredicate = isGFX7GFX10GFX11 in {


        


More information about the llvm-commits mailing list