[llvm] r212640 - Add trunc (select c, a, b) -> select c (trunc a), (trunc b) combine.

Matt Arsenault Matthew.Arsenault at amd.com
Thu Jul 10 11:15:02 PDT 2014


On 07/10/2014 05:41 AM, NAKAMURA Takumi wrote:
> Matt, excuse me, I have reverted it in r212708.
>
> SExting caused miscompilation on, at least, x86-64.
>
> // Minimal testcase to miscompile.
> unsigned foo(unsigned a, bool cc) {
>    return a << (cc ? 3 : 2);
> }
>
> define i32 @_Z3foojb(i32 %a, i1 zeroext %cc) #0 {
>    %1 = select i1 %cc, i32 3, i32 2
>    %2 = shl i32 %a, %1
>    ret i32 %2
> }
>
> I could appease miscompilation like;
>
> --- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
> +++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
> @@ -6030,8 +6030,7 @@ SDValue DAGCombiner::visitTRUNCATE(SDNode *N) {
>         SDLoc SL(N0);
>         SDValue TruncOp0 = DAG.getNode(ISD::TRUNCATE, SL, VT, N0.getOperand(1));
>         SDValue TruncOp1 = DAG.getNode(ISD::TRUNCATE, SL, VT, N0.getOperand(2));
> -      EVT SetCCVT = getSetCCResultType(VT);
> -      SDValue Cond = DAG.getSExtOrTrunc(N0.getOperand(0), SL, SetCCVT);
> +      SDValue Cond = N0.getOperand(0);
>         return DAG.getNode(ISD::SELECT, SDLoc(N), VT, Cond, TruncOp0, TruncOp1);
>       }
>     }
>
> But I thought I might revert yours for now.
> I guess you intended architectures that have bitwise bsel. I think it
> would be unsuitable to x86 ALU.

The conversion was because on my target, the select condition type is 
supposed to be the same width as the selected type. I think just passing 
it through will work, since I think it's OK if the select mask type is 
wider. I'll resubmit it with your fix.

>
> 2014-07-10 4:12 GMT+09:00 Matt Arsenault <Matthew.Arsenault at amd.com>:
>> Author: arsenm
>> Date: Wed Jul  9 14:12:07 2014
>> New Revision: 212640
>>
>> URL: http://llvm.org/viewvc/llvm-project?rev=212640&view=rev
>> Log:
>> Add trunc (select c, a, b) -> select c (trunc a), (trunc b) combine.
>>
>> Do this if the truncate is free and the select is legal.
>>
>> Modified:
>>      llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
>>      llvm/trunk/test/CodeGen/R600/select64.ll
>>      llvm/trunk/test/CodeGen/X86/shift-parts.ll
>>
>> Modified: llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
>> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp?rev=212640&r1=212639&r2=212640&view=diff
>> ==============================================================================
>> --- llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp (original)
>> +++ llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp Wed Jul  9 14:12:07 2014
>> @@ -6013,6 +6013,20 @@ SDValue DAGCombiner::visitTRUNCATE(SDNod
>>       }
>>     }
>>
>> +  // trunc (select c, a, b) -> select c, (trunc a), (trunc b)
>> +  if (N0.getOpcode() == ISD::SELECT) {
>> +    EVT SrcVT = N0.getValueType();
>> +    if ((!LegalOperations || TLI.isOperationLegal(ISD::SELECT, SrcVT)) &&
>> +        TLI.isTruncateFree(SrcVT, VT)) {
>> +      SDLoc SL(N0);
>> +      SDValue TruncOp0 = DAG.getNode(ISD::TRUNCATE, SL, VT, N0.getOperand(1));
>> +      SDValue TruncOp1 = DAG.getNode(ISD::TRUNCATE, SL, VT, N0.getOperand(2));
>> +      EVT SetCCVT = getSetCCResultType(VT);
>> +      SDValue Cond = DAG.getSExtOrTrunc(N0.getOperand(0), SL, SetCCVT);
>> +      return DAG.getNode(ISD::SELECT, SDLoc(N), VT, Cond, TruncOp0, TruncOp1);
>> +    }
>> +  }
>> +
>>     // Fold a series of buildvector, bitcast, and truncate if possible.
>>     // For example fold
>>     //   (2xi32 trunc (bitcast ((4xi32)buildvector x, x, y, y) 2xi64)) to
>>
>> Modified: llvm/trunk/test/CodeGen/R600/select64.ll
>> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/R600/select64.ll?rev=212640&r1=212639&r2=212640&view=diff
>> ==============================================================================
>> --- llvm/trunk/test/CodeGen/R600/select64.ll (original)
>> +++ llvm/trunk/test/CodeGen/R600/select64.ll Wed Jul  9 14:12:07 2014
>> @@ -13,3 +13,38 @@ entry:
>>     store i64 %1, i64 addrspace(1)* %out
>>     ret void
>>   }
>> +
>> +; CHECK-LABEL: @select_trunc_i64
>> +; CHECK: V_CNDMASK_B32
>> +; CHECK-NOT: V_CNDMASK_B32
>> +define void @select_trunc_i64(i32 addrspace(1)* %out, i32 %cond, i64 %in) nounwind {
>> +  %cmp = icmp ugt i32 %cond, 5
>> +  %sel = select i1 %cmp, i64 0, i64 %in
>> +  %trunc = trunc i64 %sel to i32
>> +  store i32 %trunc, i32 addrspace(1)* %out, align 4
>> +  ret void
>> +}
>> +
>> +; CHECK-LABEL: @select_trunc_i64_2
>> +; CHECK: V_CNDMASK_B32
>> +; CHECK-NOT: V_CNDMASK_B32
>> +define void @select_trunc_i64_2(i32 addrspace(1)* %out, i32 %cond, i64 %a, i64 %b) nounwind {
>> +  %cmp = icmp ugt i32 %cond, 5
>> +  %sel = select i1 %cmp, i64 %a, i64 %b
>> +  %trunc = trunc i64 %sel to i32
>> +  store i32 %trunc, i32 addrspace(1)* %out, align 4
>> +  ret void
>> +}
>> +
>> +; CHECK-LABEL: @v_select_trunc_i64_2
>> +; CHECK: V_CNDMASK_B32
>> +; CHECK-NOT: V_CNDMASK_B32
>> +define void @v_select_trunc_i64_2(i32 addrspace(1)* %out, i32 %cond, i64 addrspace(1)* %aptr, i64 addrspace(1)* %bptr) nounwind {
>> +  %cmp = icmp ugt i32 %cond, 5
>> +  %a = load i64 addrspace(1)* %aptr, align 8
>> +  %b = load i64 addrspace(1)* %bptr, align 8
>> +  %sel = select i1 %cmp, i64 %a, i64 %b
>> +  %trunc = trunc i64 %sel to i32
>> +  store i32 %trunc, i32 addrspace(1)* %out, align 4
>> +  ret void
>> +}
>>
>> Modified: llvm/trunk/test/CodeGen/X86/shift-parts.ll
>> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/shift-parts.ll?rev=212640&r1=212639&r2=212640&view=diff
>> ==============================================================================
>> --- llvm/trunk/test/CodeGen/X86/shift-parts.ll (original)
>> +++ llvm/trunk/test/CodeGen/X86/shift-parts.ll Wed Jul  9 14:12:07 2014
>> @@ -1,17 +1,19 @@
>> -; RUN: llc < %s -march=x86-64 | grep shrdq
>> +; RUN: llc -march=x86-64 < %s | FileCheck %s
>>   ; PR4736
>>
>>   %0 = type { i32, i8, [35 x i8] }
>>
>>   @g_144 = external global %0, align 8              ; <%0*> [#uses=1]
>>
>> -define i32 @int87(i32 %uint64p_8) nounwind {
>> +; CHECK: shrdq
>> +
>> +define i32 @int87(i32 %uint64p_8, i1 %cond) nounwind {
>>   entry:
>>     %srcval4 = load i320* bitcast (%0* @g_144 to i320*), align 8 ; <i320> [#uses=1]
>>     br label %for.cond
>>
>>   for.cond:                                         ; preds = %for.cond, %entry
>> -  %call3.in.in.in.v = select i1 undef, i320 192, i320 128 ; <i320> [#uses=1]
>> +  %call3.in.in.in.v = select i1 %cond, i320 192, i320 128 ; <i320> [#uses=1]
>>     %call3.in.in.in = lshr i320 %srcval4, %call3.in.in.in.v ; <i320> [#uses=1]
>>     %call3.in = trunc i320 %call3.in.in.in to i32   ; <i32> [#uses=1]
>>     %tobool = icmp eq i32 %call3.in, 0              ; <i1> [#uses=1]
>>
>>
>> _______________________________________________
>> llvm-commits mailing list
>> llvm-commits at cs.uiuc.edu
>> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits




More information about the llvm-commits mailing list