[llvm-commits] [llvm] r118204 - in /llvm/trunk: lib/Target/ARM/ARMISelLowering.cpp test/CodeGen/ARM/vbits.ll test/MC/ARM/neon-bitwise-encoding.s

Wed Nov 3 16:32:38 PDT 2010

Thanks, Owen.  I like this better.

The "setTargetDAGCombine(ISD::OR)" call is currently guarded by Subtarget->hasV6T2Ops(); it would be good to also call that for Subtarget->hasNEON().

The isNEONModifiedImm function currently distinguishes VMOV vs. non-VMOV immediates.  The encodings with cmode=1100 and 1101 are only available with VMOV and VMVN, so you need to add another parameter or change "isVMOV" to be an enum so that it can distinguish VORR/VBIC from VMOV/VMVN for those encodings.

On Nov 3, 2010, at 4:15 PM, Owen Anderson wrote:

> Author: resistor
> Date: Wed Nov  3 18:15:26 2010
> New Revision: 118204
> 
> URL: http://llvm.org/viewvc/llvm-project?rev=118204&view=rev
> Log:
> Covert VORRIMM to be produced via early target-specific DAG combining, rather than legalization.
> This is both the conceptually correct place for it, as well as allowing it to be more aggressive.
> 
> Modified:
>    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
>    llvm/trunk/test/CodeGen/ARM/vbits.ll
>    llvm/trunk/test/MC/ARM/neon-bitwise-encoding.s
> 
> Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=118204&r1=118203&r2=118204&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
> +++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Wed Nov  3 18:15:26 2010
> @@ -101,7 +101,6 @@
>     setOperationAction(ISD::SHL, VT.getSimpleVT(), Custom);
>     setOperationAction(ISD::SRA, VT.getSimpleVT(), Custom);
>     setOperationAction(ISD::SRL, VT.getSimpleVT(), Custom);
> -    setOperationAction(ISD::OR, VT.getSimpleVT(), Custom);
>     setLoadExtAction(ISD::SEXTLOAD, VT.getSimpleVT(), Expand);
>     setLoadExtAction(ISD::ZEXTLOAD, VT.getSimpleVT(), Expand);
>     for (unsigned InnerVT = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
> @@ -3433,32 +3432,6 @@
>   return SDValue();
> }
> 
> -static SDValue LowerOR(SDValue Op, SelectionDAG &DAG) {
> -  SDValue Op1 = Op.getOperand(1);
> -  while (Op1.getOpcode() == ISD::BIT_CONVERT && Op1.getOperand(0) != Op1)
> -    Op1 = Op1.getOperand(0);
> -  if (Op1.getOpcode() != ARMISD::VMOVIMM) return Op;
> -  
> -  ConstantSDNode* TargetConstant = cast<ConstantSDNode>(Op1.getOperand(0));
> -  uint32_t ConstVal = TargetConstant->getZExtValue();
> -
> -  // FIXME: VORRIMM only supports immediate encodings of 16 and 32 bit size.
> -  // In theory for VMOVIMMs whose value is already encoded as with an
> -  // 8 bit encoding, we could re-encode it as a 16 or 32 bit immediate.
> -  EVT VorrVT = Op1.getValueType();
> -  EVT EltVT = VorrVT.getVectorElementType();
> -  if (EltVT != MVT::i16 && EltVT != MVT::i32) return Op;
> -  
> -  ConstVal |= 0x0100;
> -  SDValue OrConst = DAG.getTargetConstant(ConstVal, MVT::i32);
> -  
> -  DebugLoc dl = Op.getDebugLoc();
> -  EVT VT = Op.getValueType();
> -  SDValue toTy = DAG.getNode(ISD::BIT_CONVERT, dl, VorrVT, Op.getOperand(0));
> -  SDValue Vorr = DAG.getNode(ARMISD::VORRIMM, dl, VorrVT, toTy, OrConst);
> -  return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vorr);
> -}
> -
> // If this is a case we can't handle, return null and let the default
> // expansion code take care of it.
> static SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG,
> @@ -3927,7 +3900,6 @@
>   case ISD::CONCAT_VECTORS: return LowerCONCAT_VECTORS(Op, DAG);
>   case ISD::FLT_ROUNDS_:   return LowerFLT_ROUNDS_(Op, DAG);
>   case ISD::MUL:           return LowerMUL(Op, DAG);
> -  case ISD::OR:            return LowerOR(Op, DAG);
>   }
>   return SDValue();
> }
> @@ -4474,6 +4446,31 @@
> static SDValue PerformORCombine(SDNode *N,
>                                 TargetLowering::DAGCombinerInfo &DCI,
>                                 const ARMSubtarget *Subtarget) {
> +  // Attempt to use immediate-form VORR
> +  BuildVectorSDNode *BVN = dyn_cast<BuildVectorSDNode>(N->getOperand(1));
> +  DebugLoc dl = N->getDebugLoc();
> +  EVT VT = N->getValueType(0);
> +  SelectionDAG &DAG = DCI.DAG;
> +  
> +  APInt SplatBits, SplatUndef;
> +  unsigned SplatBitSize;
> +  bool HasAnyUndefs;
> +  if (BVN && Subtarget->hasNEON() &&
> +      BVN->isConstantSplat(SplatBits, SplatUndef, SplatBitSize, HasAnyUndefs)) {
> +    if (SplatBitSize <= 64) {
> +      EVT VorrVT;
> +      SDValue Val = isNEONModifiedImm(SplatBits.getZExtValue(),
> +                                      SplatUndef.getZExtValue(), SplatBitSize,
> +                                      DAG, VorrVT, VT.is128BitVector(), false);
> +      if (Val.getNode()) {
> +        SDValue Input =
> +          DAG.getNode(ISD::BIT_CONVERT, dl, VorrVT, N->getOperand(0));
> +        SDValue Vorr = DAG.getNode(ARMISD::VORRIMM, dl, VorrVT, Input, Val);
> +        return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vorr);
> +      }
> +    }
> +  }
> +
>   // Try to use the ARM/Thumb2 BFI (bitfield insert) instruction when
>   // reasonable.
> 
> @@ -4481,7 +4478,6 @@
>   if (Subtarget->isThumb1Only() || !Subtarget->hasV6T2Ops())
>     return SDValue();
> 
> -  SelectionDAG &DAG = DCI.DAG;
>   SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);
>   DebugLoc DL = N->getDebugLoc();
>   // 1) or (and A, mask), val => ARMbfi A, val, mask
> @@ -4496,7 +4492,6 @@
>   if (N0.getOpcode() != ISD::AND)
>     return SDValue();
> 
> -  EVT VT = N->getValueType(0);
>   if (VT != MVT::i32)
>     return SDValue();
> 
> @@ -4565,7 +4560,7 @@
>       DCI.CombineTo(N, Res, false);
>     }
>   }
> -
> +  
>   return SDValue();
> }
> 
> 
> Modified: llvm/trunk/test/CodeGen/ARM/vbits.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/vbits.ll?rev=118204&r1=118203&r2=118204&view=diff
> ==============================================================================
> --- llvm/trunk/test/CodeGen/ARM/vbits.ll (original)
> +++ llvm/trunk/test/CodeGen/ARM/vbits.ll Wed Nov  3 18:15:26 2010
> @@ -1,4 +1,4 @@
> -; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
> +; RUN: llc < %s -march=arm -mattr=+neon -mcpu=cortex-a8 | FileCheck %s
> 
> define <8 x i8> @v_andi8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
> ;CHECK: v_andi8:
> 
> Modified: llvm/trunk/test/MC/ARM/neon-bitwise-encoding.s
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/MC/ARM/neon-bitwise-encoding.s?rev=118204&r1=118203&r2=118204&view=diff
> ==============================================================================
> --- llvm/trunk/test/MC/ARM/neon-bitwise-encoding.s (original)
> +++ llvm/trunk/test/MC/ARM/neon-bitwise-encoding.s Wed Nov  3 18:15:26 2010
> @@ -19,6 +19,8 @@
>   vorr.i32	d16, #0x1000000
> @ CHECK: vorr.i32	q8, #0x1000000  @ encoding: [0x51,0x07,0xc0,0xf2]
>   vorr.i32	q8, #0x1000000
> +@ CHECK: vorr.i32	q8, #0x0        @ encoding: [0x50,0x01,0xc0,0xf2]
> +  vorr.i32	q8, #0x0
> 
> @ CHECK: vbic	d16, d17, d16           @ encoding: [0xb0,0x01,0x51,0xf2]
> 	vbic	d16, d17, d16
> 
> 
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at cs.uiuc.edu
> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits