[llvm] [AMDGPU] Add cl option to relax lds dma waitcnt (PR #131842)
Austin Kerbow via llvm-commits
llvm-commits at lists.llvm.org
Tue Mar 18 09:16:56 PDT 2025
https://github.com/kerbowa created https://github.com/llvm/llvm-project/pull/131842
None
>From d491d2b02a40a8aedc1e54c2b2c8fe1bfb8e8cf1 Mon Sep 17 00:00:00 2001
From: Austin Kerbow <Austin.Kerbow at amd.com>
Date: Fri, 14 Mar 2025 17:44:37 -0700
Subject: [PATCH] [AMDGPU] Add cl option to relax lds dma waitcnt
---
llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp | 7 ++++++-
1 file changed, 6 insertions(+), 1 deletion(-)
diff --git a/llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp b/llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp
index 239f2664f59f3..10316bf6eb872 100644
--- a/llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp
+++ b/llvm/lib/Target/AMDGPU/SIInsertWaitcnts.cpp
@@ -58,6 +58,11 @@ static cl::opt<bool> ForceEmitZeroLoadFlag(
cl::desc("Force all waitcnt load counters to wait until 0"),
cl::init(false), cl::Hidden);
+static cl::opt<bool>
+ RelaxLDSDMA("amdgpu-relax-lds-dma-waitcnt",
+ cl::desc("Relax the waitcnt for LDS DMA instructions"),
+ cl::init(false), cl::Hidden);
+
namespace {
// Class of object that encapsulates latest instruction counter score
// associated with the operand. Used for determining whether
@@ -1748,7 +1753,7 @@ bool SIInsertWaitcnts::generateWaitcntInstBefore(MachineInstr &MI,
}
}
}
- if (!FoundAliasingStore)
+ if (!FoundAliasingStore || RelaxLDSDMA)
ScoreBrackets.determineWait(LOAD_CNT, RegNo, Wait);
if (Memop->isStore()) {
ScoreBrackets.determineWait(EXP_CNT, RegNo, Wait);
More information about the llvm-commits
mailing list