[PATCH] D66932: [LV] Tail-folding, runtime scev checks

Sjoerd Meijer via Phabricator via llvm-commits llvm-commits at lists.llvm.org
Thu Aug 29 02:39:15 PDT 2019


SjoerdMeijer created this revision.
SjoerdMeijer added reviewers: Ayal, dorit, hsaito, fhahn.
Herald added subscribers: rkruppe, hiraditya.
Herald added a project: LLVM.

Now that we allow tail-folding, not only when we optimise for size, make
sure we do not run in this assert.


https://reviews.llvm.org/D66932

Files:
  llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
  llvm/test/Transforms/LoopVectorize/X86/tail-folding-scevcheck.ll


Index: llvm/test/Transforms/LoopVectorize/X86/tail-folding-scevcheck.ll
===================================================================
--- /dev/null
+++ llvm/test/Transforms/LoopVectorize/X86/tail-folding-scevcheck.ll
@@ -0,0 +1,46 @@
+; RUN: opt < %s  -loop-vectorize -mcpu=core-avx2 -S | FileCheck %s
+
+target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
+target triple = "x86_64-unknown-linux-gnu"
+
+ at a = external dso_local local_unnamed_addr global [1024 x i32], align 16
+
+define dso_local void @_Z5doit4ic(i32 %n, i8 signext %cstep) local_unnamed_addr #0 {
+; CHECK-LABEL: @_Z5doit4ic
+; CHECK:       vector.scevcheck:
+; CHECK:       vector.ph:
+; CHECK:       vector.body:
+entry:
+  %conv = sext i8 %cstep to i32
+  %cmp9 = icmp sgt i32 %n, 0
+  br i1 %cmp9, label %for.body.preheader, label %for.end
+
+for.body.preheader:
+  %wide.trip.count = zext i32 %n to i64
+  br label %for.body
+
+for.body:
+  %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ]
+  %p.010 = phi i32 [ 0, %for.body.preheader ], [ %add, %for.body ]
+  %sext = shl i32 %p.010, 24
+  %conv1 = ashr exact i32 %sext, 24
+  %arrayidx = getelementptr inbounds [1024 x i32], [1024 x i32]* @a, i64 0, i64 %indvars.iv
+  store i32 %conv1, i32* %arrayidx, align 4
+  %add = add nsw i32 %conv1, %conv
+  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
+  %exitcond = icmp eq i64 %indvars.iv.next, %wide.trip.count
+  br i1 %exitcond, label %for.end.loopexit, label %for.body, !llvm.loop !6
+
+for.end.loopexit:
+  br label %for.end
+
+for.end:
+  ret void
+}
+
+attributes #0 = { nofree norecurse nounwind uwtable }
+
+!6 = distinct !{!6, !7, !8}
+!7 = !{!"llvm.loop.vectorize.predicate.enable", i1 true}
+!8 = !{!"llvm.loop.vectorize.enable", i1 true}
+
Index: llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
===================================================================
--- llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
+++ llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
@@ -2695,9 +2695,7 @@
     if (C->isZero())
       return;
 
-  // FIXME: FoldTailByMasking no longer implies OptForSize, this should be
-  // checking CM_ScalarEpilogueNotAllowedOptSize
-  assert(!Cost->foldTailByMasking() &&
+  assert(!BB->getParent()->hasOptSize() &&
          "Cannot SCEV check stride or overflow when folding tail");
 
   // Create a new block containing the stride check.


-------------- next part --------------
A non-text attachment was scrubbed...
Name: D66932.217805.patch
Type: text/x-patch
Size: 2398 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20190829/4c95bcf2/attachment.bin>


More information about the llvm-commits mailing list