[llvm] r340446 - [ARM] Handle all-ones mask explicitly in targetShrinkDemandedConstant.
Eli Friedman via llvm-commits
llvm-commits at lists.llvm.org
Wed Aug 22 13:13:46 PDT 2018
Author: efriedma
Date: Wed Aug 22 13:13:45 2018
New Revision: 340446
URL: http://llvm.org/viewvc/llvm-project?rev=340446&view=rev
Log:
[ARM] Handle all-ones mask explicitly in targetShrinkDemandedConstant.
This avoids a potential infinite loop setting and unsetting bits in the
mask.
Reduced from a failure on the polly-aosp bot.
Differential Revision: https://reviews.llvm.org/D51066
Added:
llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll
Modified:
llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=340446&r1=340445&r2=340446&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Wed Aug 22 13:13:45 2018
@@ -13647,14 +13647,21 @@ ARMTargetLowering::targetShrinkDemandedC
unsigned Mask = C->getZExtValue();
- // If mask is zero, nothing to do.
- if (!Mask)
- return false;
-
unsigned Demanded = DemandedAPInt.getZExtValue();
unsigned ShrunkMask = Mask & Demanded;
unsigned ExpandedMask = Mask | ~Demanded;
+ // If the mask is all zeros, let the target-independent code replace the
+ // result with zero.
+ if (ShrunkMask == 0)
+ return false;
+
+ // If the mask is all ones, erase the AND. (Currently, the target-independent
+ // code won't do this, so we have to do it explicitly to avoid an infinite
+ // loop in obscure cases.)
+ if (ExpandedMask == ~0U)
+ return TLO.CombineTo(Op, Op.getOperand(0));
+
auto IsLegalMask = [ShrunkMask, ExpandedMask](unsigned Mask) -> bool {
return (ShrunkMask & Mask) == ShrunkMask && (~ExpandedMask & Mask) == 0;
};
Added: llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll?rev=340446&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll (added)
+++ llvm/trunk/test/CodeGen/ARM/demanded-bits-and.ll Wed Aug 22 13:13:45 2018
@@ -0,0 +1,35 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=arm-eabi < %s | FileCheck %s
+
+; Make sure this doesn't hang, and there are no unnecessary
+; "and" instructions.
+
+define dso_local void @f(i16* %p) {
+; CHECK-LABEL: f:
+; CHECK: @ %bb.0: @ %entry
+; CHECK-NEXT: .LBB0_1: @ %bb
+; CHECK-NEXT: @ =>This Inner Loop Header: Depth=1
+; CHECK-NEXT: ldrh r1, [r0]
+; CHECK-NEXT: and r2, r1, #255
+; CHECK-NEXT: add r3, r2, r1, lsr #8
+; CHECK-NEXT: add r2, r3, r2
+; CHECK-NEXT: add r1, r2, r1, lsr #8
+; CHECK-NEXT: add r1, r1, #2
+; CHECK-NEXT: lsr r1, r1, #2
+; CHECK-NEXT: strh r1, [r0]
+; CHECK-NEXT: b .LBB0_1
+entry:
+ br label %bb
+
+bb:
+ %_p_scalar_ = load i16, i16* %p, align 2
+ %p_and = and i16 %_p_scalar_, 255
+ %p_ = lshr i16 %_p_scalar_, 8
+ %p_add = add nuw nsw i16 %p_, 2
+ %p_add14 = add nuw nsw i16 %p_add, %p_and
+ %p_add18 = add nuw nsw i16 %p_add14, %p_and
+ %p_add19 = add nuw nsw i16 %p_add18, %p_
+ %p_200 = lshr i16 %p_add19, 2
+ store i16 %p_200, i16* %p, align 2
+ br label %bb
+}
More information about the llvm-commits
mailing list