[llvm] 9518f03 - [Hexagon] When widening truncate result, also widen operand if necessary

Sat Sep 5 16:19:49 PDT 2020

Author: Krzysztof Parzyszek
Date: 2020-09-05T18:19:32-05:00
New Revision: 9518f032e49280d973dcae9e1ff460b1f98cc9df

URL: https://github.com/llvm/llvm-project/commit/9518f032e49280d973dcae9e1ff460b1f98cc9df
DIFF: https://github.com/llvm/llvm-project/commit/9518f032e49280d973dcae9e1ff460b1f98cc9df.diff

LOG: [Hexagon] When widening truncate result, also widen operand if necessary

Added: 
    llvm/test/CodeGen/Hexagon/autohvx/isel-widen-truncate-op.ll

Modified: 
    llvm/lib/Target/Hexagon/HexagonISelLoweringHVX.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/Hexagon/HexagonISelLoweringHVX.cpp b/llvm/lib/Target/Hexagon/HexagonISelLoweringHVX.cpp
index a2420dae8aff..604d13ee874b 100644

--- a/llvm/lib/Target/Hexagon/HexagonISelLoweringHVX.cpp
+++ b/llvm/lib/Target/Hexagon/HexagonISelLoweringHVX.cpp
@@ -1918,16 +1918,32 @@ HexagonTargetLowering::WidenHvxStore(SDValue Op, SelectionDAG &DAG) const {
 SDValue
 HexagonTargetLowering::WidenHvxTruncate(SDValue Op, SelectionDAG &DAG) const {
   const SDLoc &dl(Op);
-  MVT ResTy = ty(Op);
   unsigned HwWidth = 8*Subtarget.getVectorLength();
-  unsigned ResWidth = ResTy.getSizeInBits();
-  assert(HwWidth % ResWidth == 0);
-
-  unsigned WideNumElem = ResTy.getVectorNumElements() * (HwWidth / ResWidth);
-  MVT WideTy = MVT::getVectorVT(ResTy.getVectorElementType(), WideNumElem);
-  SDValue WideOp = DAG.getNode(HexagonISD::VPACKL, dl, WideTy,
-                               Op.getOperand(0));
-  return WideOp;
+
+  auto getFactor = [HwWidth](MVT Ty) {
+    unsigned Width = Ty.getSizeInBits();
+    assert(HwWidth % Width == 0);
+    return HwWidth / Width;
+  };
+
+  auto getWideTy = [getFactor](MVT Ty) {
+    unsigned WideLen = Ty.getVectorNumElements() * getFactor(Ty);
+    return MVT::getVectorVT(Ty.getVectorElementType(), WideLen);
+  };
+
+  SDValue Op0 = Op.getOperand(0);
+  MVT ResTy = ty(Op);
+  MVT OpTy = ty(Op0);
+  if (Subtarget.isHVXVectorType(OpTy))
+    return DAG.getNode(HexagonISD::VPACKL, dl, getWideTy(ResTy), Op0);
+
+  MVT WideOpTy = getWideTy(OpTy);
+  SmallVector<SDValue, 4> Concats = {Op0};
+  for (int i = 0, e = getFactor(OpTy) - 1; i != e; ++i)
+    Concats.push_back(DAG.getUNDEF(OpTy));
+
+  SDValue Cat = DAG.getNode(ISD::CONCAT_VECTORS, dl, WideOpTy, Concats);
+  return DAG.getNode(HexagonISD::VPACKL, dl, getWideTy(ResTy), Cat);
 }
 
 SDValue

diff  --git a/llvm/test/CodeGen/Hexagon/autohvx/isel-widen-truncate-op.ll b/llvm/test/CodeGen/Hexagon/autohvx/isel-widen-truncate-op.ll
new file mode 100644
index 000000000000..404d3d1ff260
--- /dev/null
+++ b/llvm/test/CodeGen/Hexagon/autohvx/isel-widen-truncate-op.ll
@@ -0,0 +1,37 @@
+; RUN: llc -march=hexagon -hexagon-hvx-widen=32 < %s | FileCheck %s
+; RUN: llc -march=hexagon -hexagon-hvx-widen=16 < %s | FileCheck %s
+
+; Check for successful compilation.
+; CHECK-LABEL: f0:
+; CHECK: vmemu
+
+target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
+target triple = "hexagon"
+
+define dso_local void @f0(i16* %a0) local_unnamed_addr #0 {
+b0:
+  %v0 = getelementptr i16, i16* %a0, i32 8
+  %v1 = getelementptr i16, i16* %v0, i32 0
+  %v2 = icmp eq i32 0, 0
+  %v3 = insertelement <8 x i1> undef, i1 %v2, i64 0
+  %v4 = shufflevector <8 x i1> %v3, <8 x i1> undef, <8 x i32> zeroinitializer
+  %v5 = call <8 x i32> @llvm.masked.load.v8i32.p0v8i32(<8 x i32>* nonnull undef, i32 4, <8 x i1> %v4, <8 x i32> undef)
+  %v6 = sub nsw <8 x i32> zeroinitializer, %v5
+  %v7 = add nsw <8 x i32> %v6, zeroinitializer
+  %v8 = add <8 x i32> zeroinitializer, %v7
+  %v9 = lshr <8 x i32> %v8, <i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6>
+  %v10 = trunc <8 x i32> %v9 to <8 x i16>
+  %v11 = bitcast i16* %v1 to <8 x i16>*
+  call void @llvm.masked.store.v8i16.p0v8i16(<8 x i16> %v10, <8 x i16>* %v11, i32 2, <8 x i1> %v4)
+  ret void
+}
+
+; Function Attrs: argmemonly nounwind readonly willreturn
+declare <8 x i32> @llvm.masked.load.v8i32.p0v8i32(<8 x i32>*, i32 immarg, <8 x i1>, <8 x i32>) #1
+
+; Function Attrs: argmemonly nounwind willreturn
+declare void @llvm.masked.store.v8i16.p0v8i16(<8 x i16>, <8 x i16>*, i32 immarg, <8 x i1>) #2
+
+attributes #0 = { "target-features"="+hvx-length64b,+hvxv65,+v65,-long-calls,-packets" }
+attributes #1 = { argmemonly nounwind readonly willreturn }
+attributes #2 = { argmemonly nounwind willreturn }