[llvm] [AMDGCN] Allow unscheduling of bundled insns (PR #129769)
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Thu Mar 6 17:29:51 PST 2025
================
@@ -0,0 +1,28 @@
+; REQUIRES: asserts
+; RUN: llc -mtriple=amdgcn -O1 -mcpu=gfx90a -debug-only=machine-scheduler -stop-after=machine-scheduler < %s 2>%t | FileCheck %s
+; RUN: FileCheck --check-prefix=DEBUG %s < %t
+
+; DEBUG: Attempting to revert scheduling.
+
+; CHECK: BUNDLE implicit $m0, implicit $exec {
+; CHECK-NEXT: DS_GWS_SEMA_V 0, implicit $m0, implicit $exec :: (store (s32) into custom "GWSResource")
+; CHECK-NEXT: S_WAITCNT 0
+; CHECK-NEXT: }
+
+ at G = global <32 x i8> splat (i8 1)
+ at G.1 = global <32 x i8> splat (i8 127)
+
+define amdgpu_kernel void @gws_sema_v_offset0(i32 %val) #0 {
+ %LGV1 = load <32 x i8>, ptr @G.1, align 32
+ %LGV = load <32 x i8>, ptr @G, align 32
+ call void @llvm.amdgcn.ds.gws.sema.v(i32 0)
+ %C = icmp ne <32 x i8> %LGV, %LGV1
+ store <32 x i1> %C, ptr poison, align 4
+ ret void
+}
+
+declare void @llvm.amdgcn.ds.gws.sema.v(i32) #1
+
+attributes #0 = { convergent nounwind memory(inaccessiblemem: readwrite) }
+attributes #1 = { convergent nocallback nofree nounwind willreturn memory(inaccessiblemem: readwrite) }
+
----------------
arsenm wrote:
```suggestion
```
https://github.com/llvm/llvm-project/pull/129769
More information about the llvm-commits
mailing list