[PATCH] D97035: [AArch64][GlobalISel] Support lowering <1 x i8> arguments and returning
Amara Emerson via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Thu Feb 18 23:15:42 PST 2021
aemerson created this revision.
aemerson added reviewers: paquette, arsenm.
aemerson added a project: LLVM.
Herald added subscribers: danielkiss, hiraditya, kristof.beyls, rovka.
aemerson requested review of this revision.
Herald added a subscriber: wdng.
We don't yet have working codegen for the resulting unmerge/merges, and if we did it would probably be horrible.
Repository:
rG LLVM Github Monorepo
https://reviews.llvm.org/D97035
Files:
llvm/lib/CodeGen/GlobalISel/CallLowering.cpp
llvm/lib/Target/AArch64/GISel/AArch64CallLowering.cpp
llvm/test/CodeGen/AArch64/GlobalISel/call-lowering-vectors.ll
Index: llvm/test/CodeGen/AArch64/GlobalISel/call-lowering-vectors.ll
===================================================================
--- /dev/null
+++ llvm/test/CodeGen/AArch64/GlobalISel/call-lowering-vectors.ll
@@ -0,0 +1,18 @@
+; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+; RUN: llc -mtriple=aarch64-linux-gnu -O0 -stop-after=irtranslator -global-isel -verify-machineinstrs %s -o - 2>&1 | FileCheck %s
+
+define <1 x i8> @v1s8_add(<1 x i8> %a0) nounwind {
+ ; CHECK-LABEL: name: v1s8_add
+ ; CHECK: bb.1 (%ir-block.0):
+ ; CHECK: liveins: $d0
+ ; CHECK: [[COPY:%[0-9]+]]:_(<8 x s8>) = COPY $d0
+ ; CHECK: [[UV:%[0-9]+]]:_(s8), [[UV1:%[0-9]+]]:_(s8), [[UV2:%[0-9]+]]:_(s8), [[UV3:%[0-9]+]]:_(s8), [[UV4:%[0-9]+]]:_(s8), [[UV5:%[0-9]+]]:_(s8), [[UV6:%[0-9]+]]:_(s8), [[UV7:%[0-9]+]]:_(s8) = G_UNMERGE_VALUES [[COPY]](<8 x s8>)
+ ; CHECK: [[COPY1:%[0-9]+]]:_(s8) = COPY [[UV]](s8)
+ ; CHECK: [[ADD:%[0-9]+]]:_(s8) = G_ADD [[COPY1]], [[COPY1]]
+ ; CHECK: [[DEF:%[0-9]+]]:_(s8) = G_IMPLICIT_DEF
+ ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<8 x s8>) = G_BUILD_VECTOR [[ADD]](s8), [[DEF]](s8), [[DEF]](s8), [[DEF]](s8), [[DEF]](s8), [[DEF]](s8), [[DEF]](s8), [[DEF]](s8)
+ ; CHECK: $d0 = COPY [[BUILD_VECTOR]](<8 x s8>)
+ ; CHECK: RET_ReallyLR implicit $d0
+ %res = add <1 x i8> %a0, %a0
+ ret <1 x i8> %res
+}
Index: llvm/lib/Target/AArch64/GISel/AArch64CallLowering.cpp
===================================================================
--- llvm/lib/Target/AArch64/GISel/AArch64CallLowering.cpp
+++ llvm/lib/Target/AArch64/GISel/AArch64CallLowering.cpp
@@ -378,18 +378,15 @@
CurVReg = MIRBuilder.buildInstr(ExtendOp, {NewLLT}, {CurVReg})
.getReg(0);
}
- } else if (NewLLT.getNumElements() == 2) {
- // We need to pad a <1 x S> type to <2 x S>. Since we don't have
+ } else {
+ // We need to pad a <1 x S> type to <N x S>. Since we don't have
// <1 x S> vector types in GISel we use a build_vector instead
// of a vector merge/concat.
auto Undef = MIRBuilder.buildUndef({OldLLT});
- CurVReg =
- MIRBuilder
- .buildBuildVector({NewLLT}, {CurVReg, Undef.getReg(0)})
- .getReg(0);
- } else {
- LLVM_DEBUG(dbgs() << "Could not handle ret ty");
- return false;
+ SmallVector<Register, 4> Srcs = {CurVReg};
+ for (unsigned Idx = 0; Idx < NewLLT.getNumElements() - 1; ++Idx)
+ Srcs.push_back(Undef.getReg(0));
+ CurVReg = MIRBuilder.buildBuildVector({NewLLT}, Srcs).getReg(0);
}
} else {
// A scalar extend.
Index: llvm/lib/CodeGen/GlobalISel/CallLowering.cpp
===================================================================
--- llvm/lib/CodeGen/GlobalISel/CallLowering.cpp
+++ llvm/lib/CodeGen/GlobalISel/CallLowering.cpp
@@ -545,13 +545,18 @@
// or do an unmerge to get the lower block of elements.
if (VATy.isVector() &&
VATy.getNumElements() > OrigVT.getVectorNumElements()) {
- // Just handle the case where the VA type is 2 * original type.
- if (VATy.getNumElements() != OrigVT.getVectorNumElements() * 2) {
- LLVM_DEBUG(dbgs()
- << "Incoming promoted vector arg has too many elts");
+ // Just handle the case where the VA type is a multiple original type.
+ if (VATy.getNumElements() % OrigVT.getVectorNumElements() != 0) {
+ LLVM_DEBUG(dbgs() << "Incoming promoted vector arg elts is not a "
+ "multiple of orig type elt");
return false;
}
- auto Unmerge = MIRBuilder.buildUnmerge({OrigTy, OrigTy}, {NewReg});
+ SmallVector<LLT, 4> DstTys;
+ unsigned NumParts =
+ VATy.getNumElements() / OrigVT.getVectorNumElements();
+ for (unsigned Idx = 0; Idx < NumParts; ++Idx)
+ DstTys.push_back(OrigTy);
+ auto Unmerge = MIRBuilder.buildUnmerge(DstTys, {NewReg});
MIRBuilder.buildCopy(ArgReg, Unmerge.getReg(0));
} else {
MIRBuilder.buildTrunc(ArgReg, {NewReg}).getReg(0);
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D97035.324891.patch
Type: text/x-patch
Size: 4308 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20210219/6dd15e8a/attachment.bin>
More information about the llvm-commits
mailing list