[llvm] [AMDGPU] Propagate AA info in vector load/store splitting. (PR #168871)
Leon Clark via llvm-commits
llvm-commits at lists.llvm.org
Fri Nov 21 07:37:44 PST 2025
https://github.com/PeddleSpam updated https://github.com/llvm/llvm-project/pull/168871
>From 0ba764985d74ed02e1c0eda6d7436d50ab3a01c3 Mon Sep 17 00:00:00 2001
From: Leon Clark <leoclark at amd.com>
Date: Thu, 20 Nov 2025 12:35:56 +0000
Subject: [PATCH 1/3] Propagate AA info in vector load/store splitting.
---
llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp | 11 +++++++----
1 file changed, 7 insertions(+), 4 deletions(-)
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
index 19b3ae5e695c7..5b24166b1a8be 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
@@ -1890,12 +1890,14 @@ SDValue AMDGPUTargetLowering::SplitVectorLoad(const SDValue Op,
SDValue LoLoad = DAG.getExtLoad(Load->getExtensionType(), SL, LoVT,
Load->getChain(), BasePtr, SrcValue, LoMemVT,
- BaseAlign, Load->getMemOperand()->getFlags());
+ BaseAlign, Load->getMemOperand()->getFlags(),
+ Load->getAAInfo());
SDValue HiPtr = DAG.getObjectPtrOffset(SL, BasePtr, TypeSize::getFixed(Size));
SDValue HiLoad =
DAG.getExtLoad(Load->getExtensionType(), SL, HiVT, Load->getChain(),
HiPtr, SrcValue.getWithOffset(LoMemVT.getStoreSize()),
- HiMemVT, HiAlign, Load->getMemOperand()->getFlags());
+ HiMemVT, HiAlign, Load->getMemOperand()->getFlags(),
+ Load->getAAInfo());
SDValue Join;
if (LoVT == HiVT) {
@@ -1983,10 +1985,11 @@ SDValue AMDGPUTargetLowering::SplitVectorStore(SDValue Op,
SDValue LoStore =
DAG.getTruncStore(Chain, SL, Lo, BasePtr, SrcValue, LoMemVT, BaseAlign,
- Store->getMemOperand()->getFlags());
+ Store->getMemOperand()->getFlags(), Store->getAAInfo());
SDValue HiStore =
DAG.getTruncStore(Chain, SL, Hi, HiPtr, SrcValue.getWithOffset(Size),
- HiMemVT, HiAlign, Store->getMemOperand()->getFlags());
+ HiMemVT, HiAlign, Store->getMemOperand()->getFlags(),
+ Store->getAAInfo());
return DAG.getNode(ISD::TokenFactor, SL, MVT::Other, LoStore, HiStore);
}
>From adc94c3b01abd2c9fefebb77c7e0b507bd8c4a5b Mon Sep 17 00:00:00 2001
From: Leon Clark <leoclark at amd.com>
Date: Thu, 20 Nov 2025 13:04:12 +0000
Subject: [PATCH 2/3] Formatting.
---
llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp | 23 ++++++++-----------
1 file changed, 10 insertions(+), 13 deletions(-)
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
index 5b24166b1a8be..971dfdbe3e70a 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp
@@ -1888,16 +1888,14 @@ SDValue AMDGPUTargetLowering::SplitVectorLoad(const SDValue Op,
Align BaseAlign = Load->getAlign();
Align HiAlign = commonAlignment(BaseAlign, Size);
- SDValue LoLoad = DAG.getExtLoad(Load->getExtensionType(), SL, LoVT,
- Load->getChain(), BasePtr, SrcValue, LoMemVT,
- BaseAlign, Load->getMemOperand()->getFlags(),
- Load->getAAInfo());
+ SDValue LoLoad = DAG.getExtLoad(
+ Load->getExtensionType(), SL, LoVT, Load->getChain(), BasePtr, SrcValue,
+ LoMemVT, BaseAlign, Load->getMemOperand()->getFlags(), Load->getAAInfo());
SDValue HiPtr = DAG.getObjectPtrOffset(SL, BasePtr, TypeSize::getFixed(Size));
- SDValue HiLoad =
- DAG.getExtLoad(Load->getExtensionType(), SL, HiVT, Load->getChain(),
- HiPtr, SrcValue.getWithOffset(LoMemVT.getStoreSize()),
- HiMemVT, HiAlign, Load->getMemOperand()->getFlags(),
- Load->getAAInfo());
+ SDValue HiLoad = DAG.getExtLoad(
+ Load->getExtensionType(), SL, HiVT, Load->getChain(), HiPtr,
+ SrcValue.getWithOffset(LoMemVT.getStoreSize()), HiMemVT, HiAlign,
+ Load->getMemOperand()->getFlags(), Load->getAAInfo());
SDValue Join;
if (LoVT == HiVT) {
@@ -1986,10 +1984,9 @@ SDValue AMDGPUTargetLowering::SplitVectorStore(SDValue Op,
SDValue LoStore =
DAG.getTruncStore(Chain, SL, Lo, BasePtr, SrcValue, LoMemVT, BaseAlign,
Store->getMemOperand()->getFlags(), Store->getAAInfo());
- SDValue HiStore =
- DAG.getTruncStore(Chain, SL, Hi, HiPtr, SrcValue.getWithOffset(Size),
- HiMemVT, HiAlign, Store->getMemOperand()->getFlags(),
- Store->getAAInfo());
+ SDValue HiStore = DAG.getTruncStore(
+ Chain, SL, Hi, HiPtr, SrcValue.getWithOffset(Size), HiMemVT, HiAlign,
+ Store->getMemOperand()->getFlags(), Store->getAAInfo());
return DAG.getNode(ISD::TokenFactor, SL, MVT::Other, LoStore, HiStore);
}
>From fe0995e1995b8b1d1a8bae8941e2979d3120a82a Mon Sep 17 00:00:00 2001
From: Leon Clark <leoclark at amd.com>
Date: Fri, 21 Nov 2025 15:37:19 +0000
Subject: [PATCH 3/3] Add tests.
---
.../AMDGPU/si-split-load-store-alias-info.ll | 26 +++++++++++++++++++
1 file changed, 26 insertions(+)
create mode 100644 llvm/test/CodeGen/AMDGPU/si-split-load-store-alias-info.ll
diff --git a/llvm/test/CodeGen/AMDGPU/si-split-load-store-alias-info.ll b/llvm/test/CodeGen/AMDGPU/si-split-load-store-alias-info.ll
new file mode 100644
index 0000000000000..90edb30f1a98c
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/si-split-load-store-alias-info.ll
@@ -0,0 +1,26 @@
+; RUN: llc -mtriple=amdgcn -stop-after finalize-isel < %s | FileCheck %s
+
+; This test verifies that instruction selection will propagate alias metadata
+; to split loads and stores.
+
+; CHECK: %{{[0-9]+}}:vreg_64 = DS_READ_B64 {{.*}} :: (load (s64) from %{{.*}}, !alias.scope !{{[0-9]+}}, !noalias !{{[0-9]+}}, addrspace 3)
+; CHECK: DS_WRITE_B64 {{.*}} :: (store (s64) into %{{.*}}, !alias.scope !{{[0-9]+}}, !noalias !{{[0-9]+}}, addrspace 3)
+
+define amdgpu_kernel void @test(ptr addrspace(3) noalias %in, ptr addrspace(3) noalias %out) {
+ %idx = call i32 @llvm.amdgcn.workitem.id.x()
+ %in.addr = getelementptr <16 x float>, ptr addrspace(3) %in, i32 %idx
+ %val.0 = load <16 x float>, ptr addrspace(3) %in.addr, align 32, !alias.scope !4, !noalias !5
+ %val.1 = call <16 x float> @llvm.amdgcn.wmma.f32.16x16x16.f32.v16f32.v16f32(<16 x float> %val.0, <16 x float> %val.0, <16 x float> %val.0, i1 false)
+ %out.addr = getelementptr <16 x float>, ptr addrspace(3) %out, i32 %idx
+ store <16 x float> %val.1, ptr addrspace(3) %out.addr, align 32, !alias.scope !5, !noalias !4
+ ret void
+}
+
+declare i32 @llvm.amdgcn.workitem.id.x()
+declare <16 x float> @llvm.amdgcn.wmma.f32.16x16x16.f32.v16f32.v16f32(<16 x float>, <16 x float>, <16 x float>, i1 immarg)
+
+!0 = !{!"inout.domain"}
+!1 = !{!"in.scope", !0}
+!2 = !{!"out.scope", !0}
+!4 = !{!1}
+!5 = !{!2}
More information about the llvm-commits
mailing list