[PATCH] D18197: AMDGPU/SI: Do not generate s_waitcnt for ds_permute/ds_bpermute Instructions.
Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Thu Mar 17 09:49:00 PDT 2016
This revision was automatically updated to reflect the committed changes.
Closed by commit rL263720: AMDGPU/SI: Do not generate s_waitcnt after ds_permute/ds_bpermute (authored by chfang).
Changed prior to commit:
http://reviews.llvm.org/D18197?vs=50888&id=50947#toc
Repository:
rL LLVM
http://reviews.llvm.org/D18197
Files:
llvm/trunk/lib/Target/AMDGPU/SIInstrInfo.td
llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.bpermute.ll
llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.permute.ll
Index: llvm/trunk/lib/Target/AMDGPU/SIInstrInfo.td
===================================================================
--- llvm/trunk/lib/Target/AMDGPU/SIInstrInfo.td
+++ llvm/trunk/lib/Target/AMDGPU/SIInstrInfo.td
@@ -2519,7 +2519,7 @@
dag ins = (ins VGPR_32:$addr, rc:$data0),
string asm = opName#" $vdst, $addr, $data0"> {
- let mayLoad = 0, mayStore = 0, isConvergent = 1 in {
+ let LGKM_CNT = 0, mayLoad = 0, mayStore = 0, isConvergent = 1 in {
def "" : DS_Pseudo <opName, outs, ins,
[(set (i32 rc:$vdst),
(node (i32 VGPR_32:$addr), (i32 rc:$data0)))]>;
Index: llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.bpermute.ll
===================================================================
--- llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.bpermute.ll
+++ llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.bpermute.ll
@@ -10,4 +10,28 @@
ret void
}
+; FUNC-LABEL: {{^}}bpermute_no_waitcnt_test:
+; CHECK: s_cbranch_scc1
+; CHECK: ds_bpermute_b32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
+; CHECK-NOT: s_waitcnt
+define void @bpermute_no_waitcnt_test(i32 addrspace(1)* %out, i32 %cond) {
+entry:
+
+ %tmp = icmp eq i32 %cond, 0
+ br i1 %tmp, label %if, label %else
+
+if: ; preds = %entry
+
+ %bpermute = call i32 @llvm.amdgcn.ds.bpermute(i32 0, i32 0) #0
+ br label %endif
+
+else: ; preds = %entry
+ br label %endif
+
+endif:
+ %val = phi i32 [ %bpermute, %if ], [0, %else] ; preds = %else, %if
+ store i32 %val, i32 addrspace(1)* %out, align 4
+ ret void
+}
+
attributes #0 = { nounwind readnone convergent }
Index: llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.permute.ll
===================================================================
--- llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.permute.ll
+++ llvm/trunk/test/CodeGen/AMDGPU/llvm.amdgcn.ds.permute.ll
@@ -5,9 +5,33 @@
; FUNC-LABEL: {{^}}ds_permute:
; CHECK: ds_permute_b32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
define void @ds_permute(i32 addrspace(1)* %out, i32 %index, i32 %src) nounwind {
- %bpermute = call i32 @llvm.amdgcn.ds.permute(i32 %index, i32 %src) #0
- store i32 %bpermute, i32 addrspace(1)* %out, align 4
+ %permute = call i32 @llvm.amdgcn.ds.permute(i32 %index, i32 %src) #0
+ store i32 %permute, i32 addrspace(1)* %out, align 4
ret void
}
+; FUNC-LABEL: {{^}}permute_no_waitcnt_test:
+; CHECK: s_cbranch_scc1
+; CHECK: ds_permute_b32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
+; CHECK-NOT: s_waitcnt
+define void @permute_no_waitcnt_test(i32 addrspace(1)* %out, i32 %cond) {
+entry:
+
+ %tmp = icmp eq i32 %cond, 0
+ br i1 %tmp, label %if, label %else
+
+if: ; preds = %entry
+ %permute = call i32 @llvm.amdgcn.ds.permute(i32 0, i32 0) #0
+ br label %endif
+
+else: ; preds = %entry
+ br label %endif
+
+endif:
+ %val = phi i32 [ %permute, %if ], [0, %else] ; preds = %else, %if
+ store i32 %val, i32 addrspace(1)* %out, align 4
+ ret void
+}
+
+
attributes #0 = { nounwind readnone convergent }
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D18197.50947.patch
Type: text/x-patch
Size: 3124 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20160317/203ff389/attachment.bin>
More information about the llvm-commits mailing list