[PATCH] D91512: [AArch64][Isel] Avoid implicit zext for SIGN_EXTEND_INREG ( TRUNCATE )
guopeilin via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Sun Nov 15 19:17:38 PST 2020
guopeilin created this revision.
Herald added subscribers: llvm-commits, danielkiss, hiraditya, kristof.beyls.
Herald added a project: LLVM.
guopeilin requested review of this revision.
In some cases, AArch64 use SBFMXri + COPY to implement "sign_extend_inreg (truncate)", However COPY is usually erased after Register Coalescing, so if we want to zext this result, we need to avoid using implicit zero-extend.
Repository:
rG LLVM Github Monorepo
https://reviews.llvm.org/D91512
Files:
llvm/lib/Target/AArch64/AArch64ISelLowering.h
llvm/test/CodeGen/AArch64/aarch64-avoid-implicit-zext-for-SIGN_EXTEND_INREG.ll
Index: llvm/test/CodeGen/AArch64/aarch64-avoid-implicit-zext-for-SIGN_EXTEND_INREG.ll
===================================================================
--- /dev/null
+++ llvm/test/CodeGen/AArch64/aarch64-avoid-implicit-zext-for-SIGN_EXTEND_INREG.ll
@@ -0,0 +1,28 @@
+; RUN: llc -O3 -mtriple=aarch64-unknown-linux-gnu < %s | FileCheck %s
+ at b = dso_local local_unnamed_addr global { [3 x i8], i8, i8, i8, i8, i8 } { [3 x i8] undef, i8 -64, i8 74, i8 -9, i8 -1, i8 7 }, align 8
+ at c = common dso_local local_unnamed_addr global i64 0, align 8
+ at .str = private unnamed_addr constant [9 x i8] c"c = %ld\0A\00", align 1
+
+define dso_local i8 @d(i64 %h) local_unnamed_addr {
+entry:
+ ret i8 undef
+}
+
+declare dso_local i32 @printf(i8* nocapture readonly, ...) local_unnamed_addr
+
+define dso_local i32 @main() local_unnamed_addr {
+entry:
+ %bf.load = load i64, i64* bitcast ({ [3 x i8], i8, i8, i8, i8, i8 }* @b to i64*), align 8
+ %0 = lshr i64 %bf.load, 30
+ %sext3 = shl nuw nsw i64 %0, 16
+ %sext = trunc i64 %sext3 to i32
+ %conv.i = ashr exact i32 %sext, 16
+ %conv.i.i = zext i32 %conv.i to i64
+; CHECK: // %bb.0:
+; CHECK: sbfx x{{[0-9]+}}, x{{[0-9]+}}, #{{[0-9]+}}, #{{[0-9]+}}
+; CHECK-NEXT: mov w{{[0-9]+}}, w{{[0-9]+}}
+ store i64 %conv.i.i, i64* @c, align 8
+ %call.i.i = tail call i32 (i8*, ...) @printf(i8* nonnull dereferenceable(1) getelementptr inbounds ([9 x i8], [9 x i8]* @.str, i64 0, i64 0), i64 %conv.i.i)
+ %call4.i = tail call i8 bitcast (i8 (i64)* @d to i8 (i32, i32)*)(i32 0, i32 %conv.i)
+ ret i32 0
+}
Index: llvm/lib/Target/AArch64/AArch64ISelLowering.h
===================================================================
--- llvm/lib/Target/AArch64/AArch64ISelLowering.h
+++ llvm/lib/Target/AArch64/AArch64ISelLowering.h
@@ -432,6 +432,12 @@
// FIXME: X86 also checks for CMOV here. Do we need something similar?
static inline bool isDef32(const SDNode &N) {
unsigned Opc = N.getOpcode();
+
+ if (Opc == ISD::SIGN_EXTEND_INREG) {
+ SDValue Opr = N.getOperand(0);
+ return Opr->getOpcode() != ISD::TRUNCATE;
+ }
+
return Opc != ISD::TRUNCATE && Opc != TargetOpcode::EXTRACT_SUBREG &&
Opc != ISD::CopyFromReg && Opc != ISD::AssertSext &&
Opc != ISD::AssertZext;
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D91512.305402.patch
Type: text/x-patch
Size: 2263 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20201116/0c9d064f/attachment.bin>
More information about the llvm-commits
mailing list