[llvm] r367491 - [ARM] Transform compare of masked value to shift on Thumb1.

Eli Friedman via llvm-commits llvm-commits at lists.llvm.org
Wed Jul 31 16:17:35 PDT 2019


Author: efriedma
Date: Wed Jul 31 16:17:34 2019
New Revision: 367491

URL: http://llvm.org/viewvc/llvm-project?rev=367491&view=rev
Log:
[ARM] Transform compare of masked value to shift on Thumb1.

Thumb1 has very limited immediate modes, so turning an "and" into a
shift can save multiple instructions.

It's possible to simplify the generated code for test2 and test3 in
cmp-and-fold.ll a little more, but I'll implement that as a followup.

Differential Revision: https://reviews.llvm.org/D65175


Added:
    llvm/trunk/test/CodeGen/Thumb/cmp-and-fold.ll
Modified:
    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp

Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=367491&r1=367490&r2=367491&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Wed Jul 31 16:17:34 2019
@@ -4073,6 +4073,43 @@ SDValue ARMTargetLowering::getARMCmp(SDV
     std::swap(LHS, RHS);
   }
 
+  // Thumb1 has very limited immediate modes, so turning an "and" into a
+  // shift can save multiple instructions.
+  //
+  // If we have (x & C1), and C1 is a low-bit mask with n leading zeros, we
+  // can transform it into "((x << n) >> n)".  But that isn't necessarily
+  // profitable on its own. If it's the operand to an unsigned comparison with
+  // an immediate C2, we can eliminate one of the shifts: we transform
+  // "((x << n) >> n) == C2" to "(x << n) == (C2 << n)".
+  //
+  // We avoid transforming cases which aren't profitable due to encoding
+  // details:
+  //
+  // 1. C2 fits into the immediate field of a cmp, and the transformed version
+  // would not; in that case, we're essentially trading one immediate load for
+  // another.
+  // 2. C1 is 255 or 65535, so we can use uxtb or uxth.
+  // 3. C2 is zero; we have other code for this special case.
+  //
+  // FIXME: Figure out profitability for Thumb2; we usually can't save an
+  // instruction, since the AND is always one instruction anyway, but we could
+  // use narrow instructions in some cases.
+  if (Subtarget->isThumb1Only() && LHS->getOpcode() == ISD::AND &&
+      LHS->hasOneUse() && isa<ConstantSDNode>(LHS.getOperand(1)) &&
+      LHS.getValueType() == MVT::i32 && isa<ConstantSDNode>(RHS) &&
+      !isSignedIntSetCC(CC)) {
+    unsigned Mask = cast<ConstantSDNode>(LHS.getOperand(1))->getZExtValue();
+    auto *RHSC = cast<ConstantSDNode>(RHS.getNode());
+    uint64_t RHSV = RHSC->getZExtValue();
+    if (isMask_32(Mask) && (RHSV & ~Mask) == 0 && Mask != 255 && Mask != 65535) {
+      unsigned ShiftBits = countLeadingZeros(Mask);
+      if (RHSV && (RHSV > 255 || (RHSV << ShiftBits) <= 255)) {
+        SDValue ShiftAmt = DAG.getConstant(ShiftBits, dl, MVT::i32);
+        LHS = DAG.getNode(ISD::SHL, dl, MVT::i32, LHS.getOperand(0), ShiftAmt);
+        RHS = DAG.getConstant(RHSV << ShiftBits, dl, MVT::i32);
+      }
+    }
+  }
   ARMCC::CondCodes CondCode = IntCCToARMCC(CC);
 
   // If the RHS is a constant zero then the V (overflow) flag will never be

Added: llvm/trunk/test/CodeGen/Thumb/cmp-and-fold.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/Thumb/cmp-and-fold.ll?rev=367491&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/Thumb/cmp-and-fold.ll (added)
+++ llvm/trunk/test/CodeGen/Thumb/cmp-and-fold.ll Wed Jul 31 16:17:34 2019
@@ -0,0 +1,214 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=thumbv6-eabi %s -o - | FileCheck %s
+
+define void @test1(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test1:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    lsls r0, r0, #2
+; CHECK-NEXT:    cmp r0, #68
+; CHECK-NEXT:    beq .LBB0_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB0_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 1073741823
+  %cmp = icmp eq i32 %a, 17
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test2(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test2:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    movs r2, #1
+; CHECK-NEXT:    lsls r2, r2, #31
+; CHECK-NEXT:    lsls r0, r0, #7
+; CHECK-NEXT:    cmp r0, r2
+; CHECK-NEXT:    bhi .LBB1_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB1_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = shl i32 %x, 7
+  %cmp = icmp ugt i32 %a, 2147483648
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test3(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test3:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    movs r2, #1
+; CHECK-NEXT:    lsls r2, r2, #31
+; CHECK-NEXT:    lsls r0, r0, #2
+; CHECK-NEXT:    cmp r0, r2
+; CHECK-NEXT:    bhi .LBB2_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB2_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 1073741823
+  %cmp = icmp ugt i32 %a, 536870912
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test4(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test4:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    uxtb r0, r0
+; CHECK-NEXT:    cmp r0, #17
+; CHECK-NEXT:    beq .LBB3_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB3_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 255
+  %cmp = icmp eq i32 %a, 17
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test5(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test5:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    uxth r0, r0
+; CHECK-NEXT:    cmp r0, #17
+; CHECK-NEXT:    beq .LBB4_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB4_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 65535
+  %cmp = icmp eq i32 %a, 17
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test6(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test6:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    movs r2, #32
+; CHECK-NEXT:    ands r2, r0
+; CHECK-NEXT:    cmp r2, #17
+; CHECK-NEXT:    beq .LBB5_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB5_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 32
+  %cmp = icmp eq i32 %a, 17
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test7(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test7:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    ldr r2, .LCPI6_0
+; CHECK-NEXT:    ands r2, r0
+; CHECK-NEXT:    cmp r2, #17
+; CHECK-NEXT:    beq .LBB6_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB6_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+; CHECK-NEXT:    .p2align 2
+; CHECK-NEXT:  @ %bb.3:
+; CHECK-NEXT:  .LCPI6_0:
+; CHECK-NEXT:    .long 1023 @ 0x3ff
+entry:
+  %a = and i32 %x, 1023
+  %cmp = icmp eq i32 %a, 17
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}
+
+define void @test8(i32 %x, void ()* %f)  {
+; CHECK-LABEL: test8:
+; CHECK:       @ %bb.0: @ %entry
+; CHECK-NEXT:    .save {r7, lr}
+; CHECK-NEXT:    push {r7, lr}
+; CHECK-NEXT:    movs r2, #129
+; CHECK-NEXT:    lsls r2, r2, #23
+; CHECK-NEXT:    lsls r0, r0, #22
+; CHECK-NEXT:    cmp r0, r2
+; CHECK-NEXT:    beq .LBB7_2
+; CHECK-NEXT:  @ %bb.1: @ %if.then
+; CHECK-NEXT:    blx r1
+; CHECK-NEXT:  .LBB7_2: @ %if.end
+; CHECK-NEXT:    pop {r7, pc}
+entry:
+  %a = and i32 %x, 1023
+  %cmp = icmp eq i32 %a, 258
+  br i1 %cmp, label %if.end, label %if.then
+
+if.then:
+  tail call void %f()
+  br label %if.end
+
+if.end:
+  ret void
+}




More information about the llvm-commits mailing list