[llvm-commits] [llvm] r141365 - in /llvm/trunk: lib/Target/ARM/ARMISelDAGToDAG.cpp lib/Target/ARM/ARMISelLowering.cpp lib/Target/ARM/ARMInstrInfo.td lib/Target/ARM/ARMInstrThumb2.td test/CodeGen/ARM/iabs.ll test/CodeGen/Thumb/iabs.ll

Tobias Grosser tobias at grosser.es
Fri Oct 7 10:14:36 PDT 2011


On 10/07/2011 05:15 PM, Anton Korobeynikov wrote:
> Author: asl
> Date: Fri Oct  7 11:15:08 2011
> New Revision: 141365
>
> URL: http://llvm.org/viewvc/llvm-project?rev=141365&view=rev
> Log:
> Peephole optimization for ABS on ARM.
> Patch by Ana Pazos!

Some nit picking inline.

Tobi

>
> Modified:
>      llvm/trunk/lib/Target/ARM/ARMISelDAGToDAG.cpp
>      llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
>      llvm/trunk/lib/Target/ARM/ARMInstrInfo.td
>      llvm/trunk/lib/Target/ARM/ARMInstrThumb2.td
>      llvm/trunk/test/CodeGen/ARM/iabs.ll
>      llvm/trunk/test/CodeGen/Thumb/iabs.ll
>
> Modified: llvm/trunk/lib/Target/ARM/ARMISelDAGToDAG.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelDAGToDAG.cpp?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMISelDAGToDAG.cpp (original)
> +++ llvm/trunk/lib/Target/ARM/ARMISelDAGToDAG.cpp Fri Oct  7 11:15:08 2011
> @@ -47,6 +47,11 @@
>     cl::desc("Check fp vmla / vmls hazard at isel time"),
>     cl::init(true));
>
> +static cl::opt<bool>
> +DisableARMIntABS("disable-arm-int-abs", cl::Hidden,
> +  cl::desc("Enable / disable ARM integer abs transform"),
> +  cl::init(false));
> +
>   //===--------------------------------------------------------------------===//
>   /// ARMDAGToDAGISel - ARM specific code to select ARM machine
>   /// instructions for SelectionDAG operations.
> @@ -252,6 +257,9 @@
>                                  ARMCC::CondCodes CCVal, SDValue CCR,
>                                  SDValue InFlag);
>
> +  // Select special operations if node forms integer ABS pattern
> +  SDNode *SelectABSOp(SDNode *N);
> +
>     SDNode *SelectConcatVector(SDNode *N);
>
>     SDNode *SelectAtomic64(SDNode *Node, unsigned Opc);
> @@ -2295,6 +2303,53 @@
>     return CurDAG->SelectNodeTo(N, Opc, VT, Ops, 5);
>   }
>
> +/// Target-specific DAG combining for ISD::XOR.
> +/// Target-independent combining lowers SELECT_CC nodes of the form
> +/// select_cc setg[ge] X,  0,  X, -X
> +/// select_cc setgt    X, -1,  X, -X
> +/// select_cc setl[te] X,  0, -X,  X
> +/// select_cc setlt    X,  1, -X,  X
> +/// which represent Integer ABS into:
> +/// Y = sra (X, size(X)-1); xor (add (X, Y), Y)
> +/// ARM instruction selection detects the latter and matches it to
> +/// ARM::ABS or ARM::t2ABS machine node.
> +SDNode *ARMDAGToDAGISel::SelectABSOp(SDNode *N){
> +  SDValue XORSrc0 = N->getOperand(0);
> +  SDValue XORSrc1 = N->getOperand(1);
> +  DebugLoc DL = N->getDebugLoc();
> +  EVT VT = N->getValueType(0);
> +
> +  if (DisableARMIntABS)
> +    return NULL;
> +
> +  if (XORSrc0.getOpcode() != ISD::ADD ||
> +    XORSrc1.getOpcode() != ISD::SRA)
> +    return NULL;
> +
> +  SDValue ADDSrc0 = XORSrc0.getOperand(0);
> +  SDValue ADDSrc1 = XORSrc0.getOperand(1);
> +  SDValue SRASrc0 = XORSrc1.getOperand(0);
> +  SDValue SRASrc1 = XORSrc1.getOperand(1);
> +  ConstantSDNode *SRAConstant =  dyn_cast<ConstantSDNode>(SRASrc1);
> +  EVT XType = SRASrc0.getValueType();
> +  unsigned Size = XType.getSizeInBits() - 1;
> +
> +  if (ADDSrc1 == XORSrc1&&
> +      ADDSrc0 == SRASrc0&&
> +      XType.isInteger()&&
> +      SRAConstant != NULL&&
> +      Size == SRAConstant->getZExtValue()) {
> +
> +    unsigned Opcode = ARM::ABS;
> +    if (Subtarget->isThumb2())
> +      Opcode = ARM::t2ABS;
> +
> +    return CurDAG->SelectNodeTo(N, Opcode, VT, ADDSrc0);
> +  }
> +
> +  return NULL;
> +}
> +
>   SDNode *ARMDAGToDAGISel::SelectConcatVector(SDNode *N) {
>     // The only time a CONCAT_VECTORS operation can have legal types is when
>     // two 64-bit vectors are concatenated to a 128-bit vector.
> @@ -2331,6 +2386,14 @@
>
>     switch (N->getOpcode()) {
>     default: break;
> +  case ISD::XOR: {
> +    // Select special operations if XOR node forms integer ABS pattern
> +    SDNode *ResNode = SelectABSOp(N);
> +    if (ResNode)
> +      return ResNode;
> +    // Other cases are autogenerated.
> +    break;
> +  }
>     case ISD::Constant: {
>       unsigned Val = cast<ConstantSDNode>(N)->getZExtValue();
>       bool UseCP = true;
>
> Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
> +++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Fri Oct  7 11:15:08 2011
> @@ -6100,6 +6100,86 @@
>       MI->eraseFromParent();   // The pseudo instruction is gone now.
>       return BB;
>     }
> +
> +  case ARM::ABS:
> +  case ARM::t2ABS: {
> +    // To insert an ABS instruction, we have to insert the
> +    // diamond control-flow pattern.  The incoming instruction knows the
> +    // source vreg to test against 0, the destination vreg to set,

I do not get this sentence 'The incoming instruction knows the source 
vreg to test against 0'. Can this be rephrased?

> +    // the condition code register to branch on, the
> +    // true/false values to select between, and a branch opcode to use.
> +    // It transforms
> +    //     V1 = ABS V0
> +    // into
> +    //     V2 = MOVS V0
> +    //     BCC                      (branch to SinkBB if V0>= 0)
> +    //     RSBBB: V3 = RSBri V2, 0  (compute ABS if V2<  0)
> +    //     SinkBB: V1 = PHI(V2, V3)
> +    const BasicBlock *LLVM_BB = BB->getBasicBlock();
> +    MachineFunction::iterator BBI = BB;
> +    ++BBI;
> +    MachineFunction *Fn = BB->getParent();
> +    MachineBasicBlock *RSBBB = Fn->CreateMachineBasicBlock(LLVM_BB);
> +    MachineBasicBlock *SinkBB  = Fn->CreateMachineBasicBlock(LLVM_BB);
> +    Fn->insert(BBI, RSBBB);
> +    Fn->insert(BBI, SinkBB);
> +
> +    unsigned int ABSSrcReg = MI->getOperand(1).getReg();
> +    unsigned int ABSDstReg = MI->getOperand(0).getReg();
> +    bool isThumb2 = Subtarget->isThumb2();
> +    MachineRegisterInfo&MRI = Fn->getRegInfo();
> +    // In Thumb mode S must not be specified if source register is the SP or
> +    // PC and if destination register is the SP, so restrict register class
> +    unsigned NewMovDstReg = MRI.createVirtualRegister(
> +      isThumb2 ? ARM::rGPRRegisterClass : ARM::GPRRegisterClass);
> +    unsigned NewRsbDstReg = MRI.createVirtualRegister(
> +      isThumb2 ? ARM::rGPRRegisterClass : ARM::GPRRegisterClass);
> +
> +    // Transfer the remainder of BB and its successor edges to sinkMBB.
> +    SinkBB->splice(SinkBB->begin(), BB,
> +      llvm::next(MachineBasicBlock::iterator(MI)),
> +      BB->end());
> +    SinkBB->transferSuccessorsAndUpdatePHIs(BB);
> +
> +    BB->addSuccessor(RSBBB);
> +    BB->addSuccessor(SinkBB);
> +
> +    // fall through to SinkMBB
> +    RSBBB->addSuccessor(SinkBB);
> +
> +    // insert a movs at the end of BB
> +    BuildMI(BB, dl, TII->get(isThumb2 ? ARM::t2MOVr : ARM::MOVr),
> +      NewMovDstReg)
> +      .addReg(ABSSrcReg, RegState::Kill)
> +      .addImm((unsigned)ARMCC::AL).addReg(0)
> +      .addReg(ARM::CPSR, RegState::Define);
> +
> +    // insert a bcc with opposite CC to ARMCC::MI at the end of BB
> +    BuildMI(BB, dl,
> +      TII->get(isThumb2 ? ARM::t2Bcc : ARM::Bcc)).addMBB(SinkBB)
> +      .addImm(ARMCC::getOppositeCondition(ARMCC::MI)).addReg(ARM::CPSR);
> +
> +    // insert rsbri in RSBBB
> +    // Note: BCC and rsbri will be converted into predicated rsbmi
> +    // by if-conversion pass
> +    BuildMI(*RSBBB, RSBBB->begin(), dl,
> +      TII->get(isThumb2 ? ARM::t2RSBri : ARM::RSBri), NewRsbDstReg)
> +      .addReg(NewMovDstReg, RegState::Kill)
> +      .addImm(0).addImm((unsigned)ARMCC::AL).addReg(0).addReg(0);
> +
> +    // insert PHI in SinkBB,
> +    // reuse ABSDstReg to not change uses of ABS instruction
> +    BuildMI(*SinkBB, SinkBB->begin(), dl,
> +      TII->get(ARM::PHI), ABSDstReg)
> +      .addReg(NewRsbDstReg).addMBB(RSBBB)
> +      .addReg(NewMovDstReg).addMBB(BB);
> +
> +    // remove ABS instruction
> +    MI->eraseFromParent();
> +
> +    // return last added BB
> +    return SinkBB;
> +  }
>     }
>   }
>
>
> Modified: llvm/trunk/lib/Target/ARM/ARMInstrInfo.td
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMInstrInfo.td?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMInstrInfo.td (original)
> +++ llvm/trunk/lib/Target/ARM/ARMInstrInfo.td Fri Oct  7 11:15:08 2011
> @@ -2848,6 +2848,9 @@
>     let Inst{15-12} = Rd;
>   }
>
> +def : ARMInstAlias<"movs${p} $Rd, $Rm",
> +                   (MOVr GPR:$Rd, GPR:$Rm, pred:$p, CPSR)>;
> +
>   // A version for the smaller set of tail call registers.
>   let neverHasSideEffects = 1 in
>   def MOVr_TC : AsI1<0b1101, (outs tcGPR:$Rd), (ins tcGPR:$Rm), DPFrm,
> @@ -4025,6 +4028,14 @@
>     let Inst{3-0} = opt;
>   }
>
> +// Pseudo isntruction that combines movs + predicated rsbmi
Type: 'instruction'

> +// to implement integer ABS
> +let usesCustomInserter = 1, Defs = [CPSR] in {
> +def ABS : ARMPseudoInst<
> +  (outs GPR:$dst), (ins GPR:$src),
> +  8, NoItinerary, []>;
> +}
> +
>   let usesCustomInserter = 1 in {
>     let Defs = [CPSR] in {
>       def ATOMIC_LOAD_ADD_I8 : PseudoInst<
>
> Modified: llvm/trunk/lib/Target/ARM/ARMInstrThumb2.td
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMInstrThumb2.td?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMInstrThumb2.td (original)
> +++ llvm/trunk/lib/Target/ARM/ARMInstrThumb2.td Fri Oct  7 11:15:08 2011
> @@ -3433,6 +3433,14 @@
>                 [(set rGPR:$dst, (ARMpic_add (load (ARMWrapper tconstpool:$addr)),
>                                              imm:$cp))]>,
>                  Requires<[IsThumb2]>;
> +
> +// Pseudo isntruction that combines movs + predicated rsbmi

Type: 'instruction'

> +// to implement integer ABS
> +let usesCustomInserter = 1, Defs = [CPSR] in {
> +def t2ABS : PseudoInst<(outs rGPR:$dst), (ins rGPR:$src),
> +                       NoItinerary, []>, Requires<[IsThumb2]>;
> +}
> +
>   //===----------------------------------------------------------------------===//
>   // Coprocessor load/store -- for disassembly only
>   //
>
> Modified: llvm/trunk/test/CodeGen/ARM/iabs.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/iabs.ll?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/test/CodeGen/ARM/iabs.ll (original)
> +++ llvm/trunk/test/CodeGen/ARM/iabs.ll Fri Oct  7 11:15:08 2011
> @@ -1,8 +1,8 @@
>   ; RUN: llc<  %s -march=arm -mattr=+v4t | FileCheck %s
>
>   ;; Integer absolute value, should produce something as good as: ARM:
> -;;   add r3, r0, r0, asr #31
> -;;   eor r0, r3, r0, asr #31
> +;;   movs r0, r0
> +;;   rsbmi r0, r0, #0
>   ;;   bx lr
>
>   define i32 @test(i32 %a) {
> @@ -10,7 +10,7 @@
>           %b = icmp sgt i32 %a, -1
>           %abs = select i1 %b, i32 %a, i32 %tmp1neg
>           ret i32 %abs
> -; CHECK:   add r1, r0, r0, asr #31
> -; CHECK:   eor r0, r1, r0, asr #31
> +; CHECK:  movs r0, r0
> +; CHECK:  rsbmi r0, r0, #0
>   ; CHECK:  bx lr
>   }
>
> Modified: llvm/trunk/test/CodeGen/Thumb/iabs.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/Thumb/iabs.ll?rev=141365&r1=141364&r2=141365&view=diff
> ==============================================================================
> --- llvm/trunk/test/CodeGen/Thumb/iabs.ll (original)
> +++ llvm/trunk/test/CodeGen/Thumb/iabs.ll Fri Oct  7 11:15:08 2011
> @@ -3,9 +3,9 @@
>
>   ;; Integer absolute value, should produce something as good as:
>   ;; Thumb:
> -;;   asr r2, r0, #31
> -;;   add r0, r0, r2
> -;;   eor r0, r2
> +;;   movs r0, r0
> +;;   bpl
> +;;   rsb r0, r0, #0 (with opitmization, bpl + rsb is if-converted into rsbmi)

Type 'optimization'




More information about the llvm-commits mailing list