[PATCH] D18137: AMDGPU: Prevent uniform loops from becoming infinite
Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Wed Mar 16 13:19:31 PDT 2016
This revision was automatically updated to reflect the committed changes.
Closed by commit rL263658: AMDGPU: Prevent uniform loops from becoming infinite (authored by nha).
Changed prior to commit:
http://reviews.llvm.org/D18137?vs=50560&id=50853#toc
Repository:
rL LLVM
http://reviews.llvm.org/D18137
Files:
llvm/trunk/lib/Target/AMDGPU/SILowerControlFlow.cpp
llvm/trunk/test/CodeGen/AMDGPU/uniform-loop-inside-nonuniform.ll
Index: llvm/trunk/test/CodeGen/AMDGPU/uniform-loop-inside-nonuniform.ll
===================================================================
--- llvm/trunk/test/CodeGen/AMDGPU/uniform-loop-inside-nonuniform.ll
+++ llvm/trunk/test/CodeGen/AMDGPU/uniform-loop-inside-nonuniform.ll
@@ -0,0 +1,28 @@
+;RUN: llc -march=amdgcn -mcpu=verde < %s | FileCheck %s --check-prefix=CHECK
+
+; Test a simple uniform loop that lives inside non-uniform control flow.
+
+;CHECK-LABEL: {{^}}test1:
+;CHECK: s_cbranch_execz
+;CHECK: %loop_body
+define void @test1(<8 x i32> inreg %rsrc, <2 x i32> %addr.base, i32 %y, i32 %p) #0 {
+main_body:
+ %cc = icmp eq i32 %p, 0
+ br i1 %cc, label %out, label %loop_body
+
+loop_body:
+ %counter = phi i32 [ 0, %main_body ], [ %incr, %loop_body ]
+
+ ; Prevent the loop from being optimized out
+ call void asm sideeffect "", "" ()
+
+ %incr = add i32 %counter, 1
+ %lc = icmp sge i32 %incr, 1000
+ br i1 %lc, label %out, label %loop_body
+
+out:
+ ret void
+}
+
+attributes #0 = { "ShaderType"="0" }
+attributes #1 = { nounwind readonly }
Index: llvm/trunk/lib/Target/AMDGPU/SILowerControlFlow.cpp
===================================================================
--- llvm/trunk/lib/Target/AMDGPU/SILowerControlFlow.cpp
+++ llvm/trunk/lib/Target/AMDGPU/SILowerControlFlow.cpp
@@ -137,6 +137,12 @@
NumInstr < SkipThreshold && I != E; ++I) {
if (I->isBundle() || !I->isBundled())
+ // When a uniform loop is inside non-uniform control flow, the branch
+ // leaving the loop might be an S_CBRANCH_VCCNZ, which is never taken
// when EXEC = 0. We should skip the loop lest it become infinite.
+ if (I->getOpcode() == AMDGPU::S_CBRANCH_VCCNZ)
+ return true;
+
if (++NumInstr >= SkipThreshold)
return true;
}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D18137.50853.patch
Type: text/x-patch
Size: 1817 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20160316/97c3c371/attachment.bin>
More information about the llvm-commits mailing list