[llvm] dcccb2f - [PowerPC] Fix bswap combine for big endian systems
Nemanja Ivanovic via llvm-commits
llvm-commits at lists.llvm.org
Thu Jun 24 16:28:15 PDT 2021
Author: Nemanja Ivanovic
Date: 2021-06-24T18:04:50-05:00
New Revision: dcccb2f59401f309d75b9d80afed443464c50d9d
URL: https://github.com/llvm/llvm-project/commit/dcccb2f59401f309d75b9d80afed443464c50d9d
DIFF: https://github.com/llvm/llvm-project/commit/dcccb2f59401f309d75b9d80afed443464c50d9d.diff
LOG: [PowerPC] Fix bswap combine for big endian systems
Commit 0464586ac515e8cfebe4c7615387fd625c8869f5 added a combine
for a 64-bit load feeding a bswap but the implementation is only
correct for little endian systems.
This fixes it for big endian systems.
Added:
Modified:
llvm/lib/Target/PowerPC/PPCISelLowering.cpp
llvm/test/CodeGen/PowerPC/bswap-load-store.ll
llvm/test/CodeGen/PowerPC/ld-bswap64-no-ldbrx.ll
Removed:
################################################################################
diff --git a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
index 5cb4470e0427..f2bc01bc6d9e 100644
--- a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
+++ b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
@@ -15262,7 +15262,11 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
SDValue Hi = DAG.getLoad(MVT::i32, dl, LD->getChain(), BasePtr,
LD->getPointerInfo(), LD->getAlignment());
Hi = DAG.getNode(ISD::BSWAP, dl, MVT::i32, Hi);
- SDValue Res = DAG.getNode(ISD::BUILD_PAIR, dl, MVT::i64, Hi, Lo);
+ SDValue Res;
+ if (Subtarget.isLittleEndian())
+ Res = DAG.getNode(ISD::BUILD_PAIR, dl, MVT::i64, Hi, Lo);
+ else
+ Res = DAG.getNode(ISD::BUILD_PAIR, dl, MVT::i64, Lo, Hi);
SDValue TF =
DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Hi.getOperand(0).getValue(1), Lo.getOperand(0).getValue(1));
diff --git a/llvm/test/CodeGen/PowerPC/bswap-load-store.ll b/llvm/test/CodeGen/PowerPC/bswap-load-store.ll
index e21f810040d3..0c9b7a709451 100644
--- a/llvm/test/CodeGen/PowerPC/bswap-load-store.ll
+++ b/llvm/test/CodeGen/PowerPC/bswap-load-store.ll
@@ -151,11 +151,12 @@ define i64 @LDBRX(i8* %ptr, i64 %off) {
;
; X64-LABEL: LDBRX:
; X64: # %bb.0:
-; X64-NEXT: li r5, 4
-; X64-NEXT: lwbrx r6, r3, r4
+; X64-NEXT: li r6, 4
+; X64-NEXT: lwbrx r5, r3, r4
; X64-NEXT: add r3, r3, r4
-; X64-NEXT: lwbrx r3, r3, r5
-; X64-NEXT: rldimi r3, r6, 32, 0
+; X64-NEXT: lwbrx r3, r3, r6
+; X64-NEXT: rldimi r5, r3, 32, 0
+; X64-NEXT: mr r3, r5
; X64-NEXT: blr
;
; PWR7_64-LABEL: LDBRX:
diff --git a/llvm/test/CodeGen/PowerPC/ld-bswap64-no-ldbrx.ll b/llvm/test/CodeGen/PowerPC/ld-bswap64-no-ldbrx.ll
index 27e7c7b73afa..d8889cd7c791 100644
--- a/llvm/test/CodeGen/PowerPC/ld-bswap64-no-ldbrx.ll
+++ b/llvm/test/CodeGen/PowerPC/ld-bswap64-no-ldbrx.ll
@@ -7,8 +7,8 @@ define void @bs(i64* %p) {
; CHECK-NEXT: li 4, 4
; CHECK-NEXT: lwbrx 5, 0, 3
; CHECK-NEXT: lwbrx 4, 3, 4
-; CHECK-NEXT: rldimi 4, 5, 32, 0
-; CHECK-NEXT: std 4, 0(3)
+; CHECK-NEXT: rldimi 5, 4, 32, 0
+; CHECK-NEXT: std 5, 0(3)
; CHECK-NEXT: blr
%x = load i64, i64* %p, align 8
%b = call i64 @llvm.bswap.i64(i64 %x)
@@ -42,9 +42,9 @@ define i64 @misaligned_ld(i64* %p) {
; CHECK-LABEL: misaligned_ld:
; CHECK: # %bb.0:
; CHECK-NEXT: li 4, 4
-; CHECK-NEXT: lwbrx 5, 0, 3
-; CHECK-NEXT: lwbrx 3, 3, 4
-; CHECK-NEXT: rldimi 3, 5, 32, 0
+; CHECK-NEXT: lwbrx 4, 3, 4
+; CHECK-NEXT: lwbrx 3, 0, 3
+; CHECK-NEXT: rldimi 3, 4, 32, 0
; CHECK-NEXT: blr
%x = load i64, i64* %p, align 1
%b = call i64 @llvm.bswap.i64(i64 %x)
More information about the llvm-commits
mailing list