[llvm-commits] [llvm] r168227 - in /llvm/trunk: lib/Transforms/Scalar/SROA.cpp test/Transforms/SROA/vector-extract.ll

Fri Nov 16 17:02:17 PST 2012

FYI, this was already reported as a PR. It turns out that there are
several more related bugs like this that make it more complex to solve
than just your patch.

Anyways, I was almost done testing my generalized fix, so I wanted to
give you a heads up that i'll probably replace this with the broader
version (leaving the test case).

On Fri, Nov 16, 2012 at 4:05 PM, Evan Cheng <evan.cheng at apple.com> wrote:
> Author: evancheng
> Date: Fri Nov 16 18:05:06 2012
> New Revision: 168227
>
> URL: http://llvm.org/viewvc/llvm-project?rev=168227&view=rev
> Log:
> Teach SROA rewriteVectorizedStoreInst to handle cases when the loaded value is narrower than the stored value. rdar://12713675
>
> Added:
>     llvm/trunk/test/Transforms/SROA/vector-extract.ll
> Modified:
>     llvm/trunk/lib/Transforms/Scalar/SROA.cpp
>
> Modified: llvm/trunk/lib/Transforms/Scalar/SROA.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Transforms/Scalar/SROA.cpp?rev=168227&r1=168226&r2=168227&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Transforms/Scalar/SROA.cpp (original)
> +++ llvm/trunk/lib/Transforms/Scalar/SROA.cpp Fri Nov 16 18:05:06 2012
> @@ -2559,18 +2559,55 @@
>      return NewPtr == &NewAI && !LI.isVolatile();
>    }
>
> +  bool rewriteWideStoreInst(IRBuilder<> &IRB, StoreInst &SI, Type *ValueTy,
> +                            unsigned Size) {
> +    assert(!SI.isVolatile());
> +    assert(ValueTy->isIntegerTy() &&
> +           "Only integer type loads and stores are split");
> +    assert(ValueTy->getIntegerBitWidth() ==
> +           TD.getTypeStoreSizeInBits(ValueTy) &&
> +           "Non-byte-multiple bit width");
> +    assert(ValueTy->getIntegerBitWidth() ==
> +           TD.getTypeSizeInBits(OldAI.getAllocatedType()) &&
> +           "Only alloca-wide stores can be split and recomposed");
> +    IntegerType *NarrowTy = Type::getIntNTy(SI.getContext(), Size * 8);
> +    Value *V = extractInteger(TD, IRB, SI.getValueOperand(), NarrowTy,
> +                              BeginOffset, getName(".extract"));
> +    StoreInst *NewSI;
> +    bool IsConvertable = (BeginOffset - NewAllocaBeginOffset == 0) &&
> +      canConvertValue(TD, NarrowTy, NewAllocaTy);
> +    if (IsConvertable)
> +      NewSI = IRB.CreateAlignedStore(convertValue(TD, IRB, V, NewAllocaTy),
> +                                     &NewAI, NewAI.getAlignment());
> +    else
> +      NewSI = IRB.CreateAlignedStore(
> +        V, getAdjustedAllocaPtr(IRB, NarrowTy->getPointerTo()),
> +        getPartitionTypeAlign(NarrowTy));
> +    (void)NewSI;
> +    if (Pass.DeadSplitInsts.insert(&SI))
> +      Pass.DeadInsts.push_back(&SI);
> +
> +    DEBUG(dbgs() << "          to: " << *NewSI << "\n");
> +    return IsConvertable;
> +  }
> +
>    bool rewriteVectorizedStoreInst(IRBuilder<> &IRB, StoreInst &SI,
>                                    Value *OldOp) {
>      Value *V = SI.getValueOperand();
> -    if (V->getType() == ElementTy ||
> +    Type *ValueTy = V->getType();
> +    if (ValueTy == ElementTy ||
>          BeginOffset > NewAllocaBeginOffset || EndOffset < NewAllocaEndOffset) {
> -      if (V->getType() != ElementTy)
> +      if (ValueTy != ElementTy)
>          V = convertValue(TD, IRB, V, ElementTy);
>        LoadInst *LI = IRB.CreateAlignedLoad(&NewAI, NewAI.getAlignment(),
>                                             getName(".load"));
>        V = IRB.CreateInsertElement(LI, V, getIndex(IRB, BeginOffset),
>                                    getName(".insert"));
> -    } else if (V->getType() != VecTy) {
> +    } else if (ValueTy != VecTy) {
> +      uint64_t Size = EndOffset - BeginOffset;
> +      if (Size < TD.getTypeStoreSize(ValueTy))
> +        return rewriteWideStoreInst(IRB, SI, ValueTy, Size);
> +
>        V = convertValue(TD, IRB, V, VecTy);
>      }
>      StoreInst *Store = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlignment());
> @@ -2613,36 +2650,8 @@
>      Type *ValueTy = SI.getValueOperand()->getType();
>
>      uint64_t Size = EndOffset - BeginOffset;
> -    if (Size < TD.getTypeStoreSize(ValueTy)) {
> -      assert(!SI.isVolatile());
> -      assert(ValueTy->isIntegerTy() &&
> -             "Only integer type loads and stores are split");
> -      assert(ValueTy->getIntegerBitWidth() ==
> -             TD.getTypeStoreSizeInBits(ValueTy) &&
> -             "Non-byte-multiple bit width");
> -      assert(ValueTy->getIntegerBitWidth() ==
> -             TD.getTypeSizeInBits(OldAI.getAllocatedType()) &&
> -             "Only alloca-wide stores can be split and recomposed");
> -      IntegerType *NarrowTy = Type::getIntNTy(SI.getContext(), Size * 8);
> -      Value *V = extractInteger(TD, IRB, SI.getValueOperand(), NarrowTy,
> -                                BeginOffset, getName(".extract"));
> -      StoreInst *NewSI;
> -      bool IsConvertable = (BeginOffset - NewAllocaBeginOffset == 0) &&
> -                           canConvertValue(TD, NarrowTy, NewAllocaTy);
> -      if (IsConvertable)
> -        NewSI = IRB.CreateAlignedStore(convertValue(TD, IRB, V, NewAllocaTy),
> -                                       &NewAI, NewAI.getAlignment());
> -      else
> -        NewSI = IRB.CreateAlignedStore(
> -          V, getAdjustedAllocaPtr(IRB, NarrowTy->getPointerTo()),
> -          getPartitionTypeAlign(NarrowTy));
> -      (void)NewSI;
> -      if (Pass.DeadSplitInsts.insert(&SI))
> -        Pass.DeadInsts.push_back(&SI);
> -
> -      DEBUG(dbgs() << "          to: " << *NewSI << "\n");
> -      return IsConvertable;
> -    }
> +    if (Size < TD.getTypeStoreSize(ValueTy))
> +      return rewriteWideStoreInst(IRB, SI, ValueTy, Size);
>
>      if (IntTy && ValueTy->isIntegerTy())
>        return rewriteIntegerStore(IRB, SI);
>
> Added: llvm/trunk/test/Transforms/SROA/vector-extract.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Transforms/SROA/vector-extract.ll?rev=168227&view=auto
> ==============================================================================
> --- llvm/trunk/test/Transforms/SROA/vector-extract.ll (added)
> +++ llvm/trunk/test/Transforms/SROA/vector-extract.ll Fri Nov 16 18:05:06 2012
> @@ -0,0 +1,25 @@
> +; RUN: opt < %s -sroa -S | FileCheck %s
> +; rdar://12713675
> +
> +target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
> +
> +define <2 x i16> @test1(i64 %x) nounwind ssp {
> +; CHECK: @test1
> +entry:
> +  %tmp = alloca i64, align 8
> +  br i1 undef, label %bb1, label %bb2
> +; CHECK-NOT: alloca
> +
> +bb1:
> +  store i64 %x, i64* %tmp, align 8
> +; CHECK-NOT: store
> +  %0 = bitcast i64* %tmp to <2 x i16>*
> +  %1 = load <2 x i16>* %0, align 8
> +; CHECK-NOT: load
> +; CHECK: trunc i64 %x to i32
> +; CHECK: bitcast i32
> +  ret <2 x i16> %1
> +
> +bb2:
> +  ret <2 x i16> < i16 0, i16 0 >
> +}
>
>
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at cs.uiuc.edu
> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits