[llvm] cf73a0b - [AArch64] Copy implicit def operands when creating LDP. (#164253)
via llvm-commits
llvm-commits at lists.llvm.org
Tue Nov 4 13:56:02 PST 2025
Author: David Green
Date: 2025-11-04T21:55:57Z
New Revision: cf73a0b102c012f30e5ee43638a78ed21e6b81b3
URL: https://github.com/llvm/llvm-project/commit/cf73a0b102c012f30e5ee43638a78ed21e6b81b3
DIFF: https://github.com/llvm/llvm-project/commit/cf73a0b102c012f30e5ee43638a78ed21e6b81b3.diff
LOG: [AArch64] Copy implicit def operands when creating LDP. (#164253)
Otherwise we might end up with undefined register uses. Copying implicit
uses can cause problems where a register is both defined and used in the
same LDP, so I have not tried to add them here.
Fixes #164230
Added:
llvm/test/CodeGen/AArch64/ldst-implicitop.mir
Modified:
llvm/lib/Target/AArch64/AArch64LoadStoreOptimizer.cpp
Removed:
################################################################################
diff --git a/llvm/lib/Target/AArch64/AArch64LoadStoreOptimizer.cpp b/llvm/lib/Target/AArch64/AArch64LoadStoreOptimizer.cpp
index e69fa32967a79..2ab7bf19da410 100644
--- a/llvm/lib/Target/AArch64/AArch64LoadStoreOptimizer.cpp
+++ b/llvm/lib/Target/AArch64/AArch64LoadStoreOptimizer.cpp
@@ -1386,6 +1386,25 @@ AArch64LoadStoreOpt::mergePairedInsns(MachineBasicBlock::iterator I,
if (MOP.isReg() && MOP.isKill())
DefinedInBB.addReg(MOP.getReg());
+ // Copy over any implicit-def operands. This is like MI.copyImplicitOps, but
+ // only copies implicit defs and makes sure that each operand is only added
+ // once in case of duplicates.
+ auto CopyImplicitOps = [&](MachineBasicBlock::iterator MI1,
+ MachineBasicBlock::iterator MI2) {
+ SmallSetVector<Register, 4> Ops;
+ for (const MachineOperand &MO :
+ llvm::drop_begin(MI1->operands(), MI1->getDesc().getNumOperands()))
+ if (MO.isReg() && MO.isImplicit() && MO.isDef())
+ Ops.insert(MO.getReg());
+ for (const MachineOperand &MO :
+ llvm::drop_begin(MI2->operands(), MI2->getDesc().getNumOperands()))
+ if (MO.isReg() && MO.isImplicit() && MO.isDef())
+ Ops.insert(MO.getReg());
+ for (auto Op : Ops)
+ MIB.addDef(Op, RegState::Implicit);
+ };
+ CopyImplicitOps(I, Paired);
+
// Erase the old instructions.
I->eraseFromParent();
Paired->eraseFromParent();
diff --git a/llvm/test/CodeGen/AArch64/ldst-implicitop.mir b/llvm/test/CodeGen/AArch64/ldst-implicitop.mir
new file mode 100644
index 0000000000000..34e8cf282669c
--- /dev/null
+++ b/llvm/test/CodeGen/AArch64/ldst-implicitop.mir
@@ -0,0 +1,80 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 6
+# RUN: llc -mtriple=aarch64-- -run-pass=aarch64-ldst-opt -verify-machineinstrs -o - %s | FileCheck %s
+# Check that we copy implicit operands.
+---
+name: impdef_op1
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $lr
+ ; CHECK-LABEL: name: impdef_op1
+ ; CHECK: liveins: $lr
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: renamable $q5, renamable $q20 = LDPQi renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ ; CHECK-NEXT: $q0 = ORRv16i8 $q4, killed $q4
+ ; CHECK-NEXT: $q1 = ORRv16i8 $q5, killed $q5
+ ; CHECK-NEXT: RET_ReallyLR
+ renamable $q5 = LDRQui renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ renamable $q20 = LDRQui renamable $lr, 4 :: (load (s128))
+ $q0 = ORRv16i8 $q4, killed $q4
+ $q1 = ORRv16i8 $q5, killed $q5
+ RET_ReallyLR
+...
+---
+name: impdef_op2
+body: |
+ bb.0:
+ liveins: $lr
+ ; CHECK-LABEL: name: impdef_op2
+ ; CHECK: liveins: $lr
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: renamable $q20, renamable $q5 = LDPQi renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ ; CHECK-NEXT: $q0 = ORRv16i8 $q4, killed $q4
+ ; CHECK-NEXT: $q1 = ORRv16i8 $q5, killed $q5
+ ; CHECK-NEXT: RET_ReallyLR
+ renamable $q20 = LDRQui renamable $lr, 3 :: (load (s128))
+ renamable $q5 = LDRQui renamable $lr, 4, implicit-def $q4_q5 :: (load (s128))
+ $q0 = ORRv16i8 $q4, killed $q4
+ $q1 = ORRv16i8 $q5, killed $q5
+ RET_ReallyLR
+...
+---
+name: impdef_both
+body: |
+ bb.0:
+ liveins: $lr
+ ; CHECK-LABEL: name: impdef_both
+ ; CHECK: liveins: $lr
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: renamable $q5, renamable $q20 = LDPQi renamable $lr, 3, implicit-def $q4_q5, implicit-def $q20_q21 :: (load (s128))
+ ; CHECK-NEXT: $q0 = ORRv16i8 $q4, killed $q4
+ ; CHECK-NEXT: $q1 = ORRv16i8 $q5, killed $q5
+ ; CHECK-NEXT: $q2 = ORRv16i8 $q20, killed $q20
+ ; CHECK-NEXT: $q3 = ORRv16i8 $q21, killed $q21
+ ; CHECK-NEXT: RET_ReallyLR
+ renamable $q5 = LDRQui renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ renamable $q20 = LDRQui renamable $lr, 4, implicit-def $q20_q21 :: (load (s128))
+ $q0 = ORRv16i8 $q4, killed $q4
+ $q1 = ORRv16i8 $q5, killed $q5
+ $q2 = ORRv16i8 $q20, killed $q20
+ $q3 = ORRv16i8 $q21, killed $q21
+ RET_ReallyLR
+...
+---
+name: impdef_both_same
+body: |
+ bb.0:
+ liveins: $lr
+ ; CHECK-LABEL: name: impdef_both_same
+ ; CHECK: liveins: $lr
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: renamable $q5, renamable $q20 = LDPQi renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ ; CHECK-NEXT: $q0 = ORRv16i8 $q4, killed $q4
+ ; CHECK-NEXT: $q1 = ORRv16i8 $q5, killed $q5
+ ; CHECK-NEXT: RET_ReallyLR
+ renamable $q5 = LDRQui renamable $lr, 3, implicit-def $q4_q5 :: (load (s128))
+ renamable $q20 = LDRQui renamable $lr, 4, implicit-def $q4_q5 :: (load (s128))
+ $q0 = ORRv16i8 $q4, killed $q4
+ $q1 = ORRv16i8 $q5, killed $q5
+ RET_ReallyLR
+...
More information about the llvm-commits mailing list