[llvm] r340446 - [ARM] Handle all-ones mask explicitly in targetShrinkDemandedConstant.

Eli Friedman via llvm-commits llvm-commits at lists.llvm.org
Wed Aug 22 13:13:46 PDT 2018


Author: efriedma
Date: Wed Aug 22 13:13:45 2018
New Revision: 340446

URL: http://llvm.org/viewvc/llvm-project?rev=340446&view=rev
Log:
[ARM] Handle all-ones mask explicitly in targetShrinkDemandedConstant.

This avoids a potential infinite loop setting and unsetting bits in the
mask.

Reduced from a failure on the polly-aosp bot.

Differential Revision: https://reviews.llvm.org/D51066


Added:
    llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll
Modified:
    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp

Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=340446&r1=340445&r2=340446&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Wed Aug 22 13:13:45 2018
@@ -13647,14 +13647,21 @@ ARMTargetLowering::targetShrinkDemandedC
 
   unsigned Mask = C->getZExtValue();
 
-  // If mask is zero, nothing to do.
-  if (!Mask)
-    return false;
-
   unsigned Demanded = DemandedAPInt.getZExtValue();
   unsigned ShrunkMask = Mask & Demanded;
   unsigned ExpandedMask = Mask | ~Demanded;
 
+  // If the mask is all zeros, let the target-independent code replace the
+  // result with zero.
+  if (ShrunkMask == 0)
+    return false;
+
+  // If the mask is all ones, erase the AND. (Currently, the target-independent
+  // code won't do this, so we have to do it explicitly to avoid an infinite
+  // loop in obscure cases.)
+  if (ExpandedMask == ~0U)
+    return TLO.CombineTo(Op, Op.getOperand(0));
+
   auto IsLegalMask = [ShrunkMask, ExpandedMask](unsigned Mask) -> bool {
     return (ShrunkMask & Mask) == ShrunkMask && (~ExpandedMask & Mask) == 0;
   };

Added: llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll?rev=340446&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll (added)
+++ llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll Wed Aug 22 13:13:45 2018
@@ -0,0 +1,35 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=arm-eabi < %s | FileCheck %s
+
+; Make sure this doesn't hang, and there are no unnecessary
+; "and" instructions.
+
+define dso_local void @f(i16* %p) {
+; CHECK-LABEL: f:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:  .LBB0_1: @ %bb
+; CHECK-NEXT:    @ =>This Inner Loop Header: Depth=1
+; CHECK-NEXT:    ldrh r1, [r0]
+; CHECK-NEXT:    and r2, r1, #255
+; CHECK-NEXT:    add r3, r2, r1, lsr #8
+; CHECK-NEXT:    add r2, r3, r2
+; CHECK-NEXT:    add r1, r2, r1, lsr #8
+; CHECK-NEXT:    add r1, r1, #2
+; CHECK-NEXT:    lsr r1, r1, #2
+; CHECK-NEXT:    strh r1, [r0]
+; CHECK-NEXT:    b .LBB0_1
+entry:
+  br label %bb
+
+bb:
+  %_p_scalar_ = load i16, i16* %p, align 2
+  %p_and = and i16 %_p_scalar_, 255
+  %p_ = lshr i16 %_p_scalar_, 8
+  %p_add = add nuw nsw i16 %p_, 2
+  %p_add14 = add nuw nsw i16 %p_add, %p_and
+  %p_add18 = add nuw nsw i16 %p_add14, %p_and
+  %p_add19 = add nuw nsw i16 %p_add18, %p_
+  %p_200 = lshr i16 %p_add19, 2
+  store i16 %p_200, i16* %p, align 2
+  br label %bb
+}




More information about the llvm-commits mailing list