[llvm] r182364 - X86: When emulating unsigned PCMPGTQ with PCMPGTD, fix the sign bit for the smaller type.

Benjamin Kramer benny.kra at gmail.com
Tue May 21 03:11:55 PDT 2013


On 21.05.2013, at 11:58, Benjamin Kramer <benny.kra at googlemail.com> wrote:

> Author: d0k
> Date: Tue May 21 04:58:54 2013
> New Revision: 182364
> 
> URL: http://llvm.org/viewvc/llvm-project?rev=182364&view=rev
> Log:
> X86: When emulating unsigned PCMPGTQ with PCMPGTD, fix the sign bit for the smaller type.
> 
> Otherwise we'll get a mix of signed and unsigned compares.
> Fixes PR15977.

This fixes a regression and should go into 3.3.

- Ben

> 
> Modified:
>    llvm/trunk/lib/Target/X86/X86ISelLowering.cpp
>    llvm/trunk/test/CodeGen/X86/vec_compare.ll
> 
> Modified: llvm/trunk/lib/Target/X86/X86ISelLowering.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/X86/X86ISelLowering.cpp?rev=182364&r1=182363&r2=182364&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/X86/X86ISelLowering.cpp (original)
> +++ llvm/trunk/lib/Target/X86/X86ISelLowering.cpp Tue May 21 04:58:54 2013
> @@ -9347,29 +9347,24 @@ static SDValue LowerVSETCC(SDValue Op, c
>   if (Swap)
>     std::swap(Op0, Op1);
> 
> -  // Since SSE has no unsigned integer comparisons, we need to flip  the sign
> -  // bits of the inputs before performing those operations.
> -  if (FlipSigns) {
> -    EVT EltVT = VT.getVectorElementType();
> -    SDValue SignBit = DAG.getConstant(APInt::getSignBit(EltVT.getSizeInBits()),
> -                                      EltVT);
> -    std::vector<SDValue> SignBits(VT.getVectorNumElements(), SignBit);
> -    SDValue SignVec = DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &SignBits[0],
> -                                    SignBits.size());
> -    Op0 = DAG.getNode(ISD::XOR, dl, VT, Op0, SignVec);
> -    Op1 = DAG.getNode(ISD::XOR, dl, VT, Op1, SignVec);
> -  }
> -
>   // Check that the operation in question is available (most are plain SSE2,
>   // but PCMPGTQ and PCMPEQQ have different requirements).
>   if (VT == MVT::v2i64) {
>     if (Opc == X86ISD::PCMPGT && !Subtarget->hasSSE42()) {
>       assert(Subtarget->hasSSE2() && "Don't know how to lower!");
> 
> -      // First cast everything to the right type,
> +      // First cast everything to the right type.
>       Op0 = DAG.getNode(ISD::BITCAST, dl, MVT::v4i32, Op0);
>       Op1 = DAG.getNode(ISD::BITCAST, dl, MVT::v4i32, Op1);
> 
> +      // Since SSE has no unsigned integer comparisons, we need to flip the sign
> +      // bits of the inputs before performing those operations.
> +      if (FlipSigns) {
> +        SDValue SB = DAG.getConstant(0x80000000U, MVT::v4i32);
> +        Op0 = DAG.getNode(ISD::XOR, dl, MVT::v4i32, Op0, SB);
> +        Op1 = DAG.getNode(ISD::XOR, dl, MVT::v4i32, Op1, SB);
> +      }
> +
>       // Emulate PCMPGTQ with (hi1 > hi2) | ((hi1 == hi2) & (lo1 > lo2))
>       SDValue GT = DAG.getNode(X86ISD::PCMPGT, dl, MVT::v4i32, Op0, Op1);
>       SDValue EQ = DAG.getNode(X86ISD::PCMPEQ, dl, MVT::v4i32, Op0, Op1);
> @@ -9395,7 +9390,7 @@ static SDValue LowerVSETCC(SDValue Op, c
>       // pcmpeqd + pshufd + pand.
>       assert(Subtarget->hasSSE2() && !FlipSigns && "Don't know how to lower!");
> 
> -      // First cast everything to the right type,
> +      // First cast everything to the right type.
>       Op0 = DAG.getNode(ISD::BITCAST, dl, MVT::v4i32, Op0);
>       Op1 = DAG.getNode(ISD::BITCAST, dl, MVT::v4i32, Op1);
> 
> @@ -9414,6 +9409,15 @@ static SDValue LowerVSETCC(SDValue Op, c
>     }
>   }
> 
> +  // Since SSE has no unsigned integer comparisons, we need to flip the sign
> +  // bits of the inputs before performing those operations.
> +  if (FlipSigns) {
> +    EVT EltVT = VT.getVectorElementType();
> +    SDValue SB = DAG.getConstant(APInt::getSignBit(EltVT.getSizeInBits()), VT);
> +    Op0 = DAG.getNode(ISD::XOR, dl, VT, Op0, SB);
> +    Op1 = DAG.getNode(ISD::XOR, dl, VT, Op1, SB);
> +  }
> +
>   SDValue Result = DAG.getNode(Opc, dl, VT, Op0, Op1);
> 
>   // If the logical-not of the result is required, perform that now.
> 
> Modified: llvm/trunk/test/CodeGen/X86/vec_compare.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/vec_compare.ll?rev=182364&r1=182363&r2=182364&view=diff
> ==============================================================================
> --- llvm/trunk/test/CodeGen/X86/vec_compare.ll (original)
> +++ llvm/trunk/test/CodeGen/X86/vec_compare.ll Tue May 21 04:58:54 2013
> @@ -131,9 +131,15 @@ define <2 x i64> @test10(<2 x i64> %A, <
> }
> 
> define <2 x i64> @test11(<2 x i64> %A, <2 x i64> %B) nounwind {
> +; CHECK: [[CONSTSEG:[A-Z0-9_]*]]:
> +; CHECK:      .long	2147483648
> +; CHECK-NEXT: .long	2147483648
> +; CHECK-NEXT: .long	2147483648
> +; CHECK-NEXT: .long	2147483648
> ; CHECK: test11:
> -; CHECK: pxor
> -; CHECK: pxor
> +; CHECK: movdqa [[CONSTSEG]], [[CONSTREG:%xmm[0-9]*]]
> +; CHECK: pxor [[CONSTREG]]
> +; CHECK: pxor [[CONSTREG]]
> ; CHECK: pcmpgtd %xmm1
> ; CHECK: pshufd $-96
> ; CHECK: pcmpeqd
> 
> 
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at cs.uiuc.edu
> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits





More information about the llvm-commits mailing list