[llvm] [TableGen] Add support for per-write cycle tunables (PR #125870)

Ricardo Jesus via llvm-commits llvm-commits at lists.llvm.org
Wed Feb 5 07:41:56 PST 2025


https://github.com/rj-jesus updated https://github.com/llvm/llvm-project/pull/125870

>From 6eddb57953e186f97f10934022fcc9e96d0a0835 Mon Sep 17 00:00:00 2001
From: Ricardo Jesus <rjj at nvidia.com>
Date: Thu, 23 Jan 2025 04:04:21 -0800
Subject: [PATCH 1/3] Pre-commit test

---
 llvm/test/TableGen/PreWriteCycleCount.td | 39 ++++++++++++++++++++++++
 1 file changed, 39 insertions(+)
 create mode 100644 llvm/test/TableGen/PreWriteCycleCount.td

diff --git a/llvm/test/TableGen/PreWriteCycleCount.td b/llvm/test/TableGen/PreWriteCycleCount.td
new file mode 100644
index 000000000000000..d3e7006795cff7e
--- /dev/null
+++ b/llvm/test/TableGen/PreWriteCycleCount.td
@@ -0,0 +1,39 @@
+// RUN: llvm-tblgen -gen-subtarget -I %p/../../include %s 2>&1 | FileCheck %s
+
+// Make sure that ReadAdvance entries with multiple writes are correctly
+// handled.
+
+include "llvm/Target/Target.td"
+
+def MyTarget : Target;
+
+let OutOperandList = (outs), InOperandList = (ins) in {
+  def Inst_A : Instruction;
+  def Inst_B : Instruction;
+  def Inst_C : Instruction;
+}
+
+let CompleteModel = 0 in {
+  def SchedModel_A: SchedMachineModel;
+}
+
+def Read_D : SchedRead;
+
+// CHECK: extern const llvm::MCReadAdvanceEntry MyTargetReadAdvanceTable[] = {
+// CHECK-NEXT:  {0,  0,  0}, // Invalid
+// CHECK-NEXT:  {0,  3,  2} // #1
+// CHECK-NEXT: }; // MyTargetReadAdvanceTable
+
+let SchedModel = SchedModel_A in {
+  def Write_A : SchedWriteRes<[]>;
+  def Write_B : SchedWriteRes<[]>;
+  def Write_C : SchedWriteRes<[]>;
+
+  def : InstRW<[Write_A], (instrs Inst_A)>;
+  def : InstRW<[Write_B], (instrs Inst_B)>;
+  def : InstRW<[Write_C, Read_D], (instrs Inst_C)>;
+
+  def : ReadAdvance<Read_D, 2, [Write_C]>;
+}
+
+def ProcessorA: ProcessorModel<"ProcessorA", SchedModel_A, []>;

>From 2c41e9329a575ba4aed232276a19f31fcb26015d Mon Sep 17 00:00:00 2001
From: Ricardo Jesus <rjj at nvidia.com>
Date: Wed, 22 Jan 2025 10:26:22 -0800
Subject: [PATCH 2/3] [TableGen] Add support for per-write cycle tunables

This patch adds support for describing per-write resource cycle counts
for ReadAdvance records via a new optional field called `tunables'.

This makes it possible to declare ReadAdvance records such as:

  def : ReadAdvance<Read_C, 1, [Write_A, Write_B], [2]>;

The above will effectivelly declare two entries in the ReadAdvance
table for Read_C, one for Write_A with a cycle count of 1+2, and one for
Write_B with a cycle count of 1+0 (omitted values are assumed 0).

The field `tunables' provides a list of deltas relative to the base
`cycle' count of the ReadAdvance. Since the field is optional and
defaults to a list of 0's, this change doesn't affect current targets.
---
 llvm/include/llvm/Target/TargetSchedule.td | 14 +++++++++-----
 llvm/test/TableGen/PreWriteCycleCount.td   |  6 ++++--
 llvm/utils/TableGen/SubtargetEmitter.cpp   | 19 +++++++++++++------
 3 files changed, 26 insertions(+), 13 deletions(-)

diff --git a/llvm/include/llvm/Target/TargetSchedule.td b/llvm/include/llvm/Target/TargetSchedule.td
index 2562ed0901303fe..4b82c1e2410fc8c 100644
--- a/llvm/include/llvm/Target/TargetSchedule.td
+++ b/llvm/include/llvm/Target/TargetSchedule.td
@@ -321,9 +321,11 @@ class SchedWriteRes<list<ProcResourceKind> resources> : SchedWrite,
 // Define values common to ReadAdvance and SchedReadAdvance.
 //
 // SchedModel ties these resources to a processor.
-class ProcReadAdvance<int cycles, list<SchedWrite> writes = []> {
+class ProcReadAdvance<int cycles, list<SchedWrite> writes = [],
+                      list<int> tunables = []> {
   int Cycles = cycles;
   list<SchedWrite> ValidWrites = writes;
+  list<int> CycleTunables = tunables;
   // Allow a processor to mark some scheduling classes as unsupported
   // for stronger verification.
   bit Unsupported = false;
@@ -340,15 +342,17 @@ class ProcReadAdvance<int cycles, list<SchedWrite> writes = []> {
 // indicate operands that are always read this number of Cycles later
 // than a normal register read, allowing the read's parent instruction
 // to issue earlier relative to the writer.
-class ReadAdvance<SchedRead read, int cycles, list<SchedWrite> writes = []>
-  : ProcReadAdvance<cycles, writes> {
+class ReadAdvance<SchedRead read, int cycles, list<SchedWrite> writes = [],
+                  list<int> tunables = []>
+  : ProcReadAdvance<cycles, writes, tunables> {
   SchedRead ReadType = read;
 }
 
 // Directly associate a new SchedRead type with a delay and optional
 // pipeline bypass. For use with InstRW or ItinRW.
-class SchedReadAdvance<int cycles, list<SchedWrite> writes = []> : SchedRead,
-  ProcReadAdvance<cycles, writes>;
+class SchedReadAdvance<int cycles, list<SchedWrite> writes = [],
+                       list<int> tunables = []>
+  : SchedRead, ProcReadAdvance<cycles, writes, tunables>;
 
 // Define SchedRead defaults. Reads seldom need special treatment.
 def ReadDefault : SchedRead;
diff --git a/llvm/test/TableGen/PreWriteCycleCount.td b/llvm/test/TableGen/PreWriteCycleCount.td
index d3e7006795cff7e..40260a9bacef449 100644
--- a/llvm/test/TableGen/PreWriteCycleCount.td
+++ b/llvm/test/TableGen/PreWriteCycleCount.td
@@ -21,7 +21,9 @@ def Read_D : SchedRead;
 
 // CHECK: extern const llvm::MCReadAdvanceEntry MyTargetReadAdvanceTable[] = {
 // CHECK-NEXT:  {0,  0,  0}, // Invalid
-// CHECK-NEXT:  {0,  3,  2} // #1
+// CHECK-NEXT:  {0,  1,  1}, // #1
+// CHECK-NEXT:  {0,  2,  3}, // #2
+// CHECK-NEXT:  {0,  3,  2} // #3
 // CHECK-NEXT: }; // MyTargetReadAdvanceTable
 
 let SchedModel = SchedModel_A in {
@@ -33,7 +35,7 @@ let SchedModel = SchedModel_A in {
   def : InstRW<[Write_B], (instrs Inst_B)>;
   def : InstRW<[Write_C, Read_D], (instrs Inst_C)>;
 
-  def : ReadAdvance<Read_D, 2, [Write_C]>;
+  def : ReadAdvance<Read_D, 2, [Write_A, Write_B, Write_C], [-1, 1]>;
 }
 
 def ProcessorA: ProcessorModel<"ProcessorA", SchedModel_A, []>;
diff --git a/llvm/utils/TableGen/SubtargetEmitter.cpp b/llvm/utils/TableGen/SubtargetEmitter.cpp
index 49362ff5ef65563..ec0990292738230 100644
--- a/llvm/utils/TableGen/SubtargetEmitter.cpp
+++ b/llvm/utils/TableGen/SubtargetEmitter.cpp
@@ -1308,23 +1308,30 @@ void SubtargetEmitter::genSchedClassTables(const CodeGenProcModel &ProcModel,
       }
       ConstRecVec ValidWrites =
           ReadAdvance->getValueAsListOfDefs("ValidWrites");
-      IdxVec WriteIDs;
+      std::vector<int64_t> CycleTunables =
+          ReadAdvance->getValueAsListOfInts("CycleTunables");
+      std::vector<std::pair<unsigned, int>> WriteIDs;
+      if (!CycleTunables.empty() && CycleTunables.size() > ValidWrites.size())
+        PrintFatalError(ReadAdvance->getLoc(),
+                        "If specified, CycleTunables must have at most the "
+                        "same number of elements of ValidWrites.\n");
+      CycleTunables.resize(ValidWrites.size(), 0);
       if (ValidWrites.empty())
-        WriteIDs.push_back(0);
+        WriteIDs.push_back(std::make_pair(0, 0));
       else {
-        for (const Record *VW : ValidWrites) {
+        for (const auto [VW, CT] : zip_equal(ValidWrites, CycleTunables)) {
           unsigned WriteID = SchedModels.getSchedRWIdx(VW, /*IsRead=*/false);
           assert(WriteID != 0 &&
                  "Expected a valid SchedRW in the list of ValidWrites");
-          WriteIDs.push_back(WriteID);
+          WriteIDs.push_back(std::make_pair(WriteID, CT));
         }
       }
       llvm::sort(WriteIDs);
-      for (unsigned W : WriteIDs) {
+      for (const auto &[W, T] : WriteIDs) {
         MCReadAdvanceEntry RAEntry;
         RAEntry.UseIdx = UseIdx;
         RAEntry.WriteResourceID = W;
-        RAEntry.Cycles = ReadAdvance->getValueAsInt("Cycles");
+        RAEntry.Cycles = ReadAdvance->getValueAsInt("Cycles") + T;
         ReadAdvanceEntries.push_back(RAEntry);
       }
     }

>From 6d553fedf7657a2ce3ca26916362840c9697d8cc Mon Sep 17 00:00:00 2001
From: Ricardo Jesus <rjj at nvidia.com>
Date: Wed, 5 Feb 2025 15:41:03 +0000
Subject: [PATCH 3/3] Fix typo in name

---
 .../TableGen/{PreWriteCycleCount.td => PerWriteCycleCount.td}     | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename llvm/test/TableGen/{PreWriteCycleCount.td => PerWriteCycleCount.td} (100%)

diff --git a/llvm/test/TableGen/PreWriteCycleCount.td b/llvm/test/TableGen/PerWriteCycleCount.td
similarity index 100%
rename from llvm/test/TableGen/PreWriteCycleCount.td
rename to llvm/test/TableGen/PerWriteCycleCount.td



More information about the llvm-commits mailing list