[llvm] [AMDGPU] Remove s_delay_alu for VALU->SGPR->SALU (PR #127212)

Ana Mihajlovic via llvm-commits llvm-commits at lists.llvm.org
Fri Feb 21 07:56:03 PST 2025


================
@@ -371,12 +376,51 @@ class AMDGPUInsertDelayAlu : public MachineFunctionPass {
             for (MCRegUnit Unit : TRI->regunits(Op.getReg())) {
               auto It = State.find(Unit);
               if (It != State.end()) {
-                Delay.merge(It->second);
-                State.erase(Unit);
+                if (SII->isSALU(MI.getOpcode()) &&
+                    AMDGPU::isSGPR(Op.getReg(), TRI) &&
+                    It->second.VALUCycles > 0) {
+                  deletedCyclesNum = It->second.VALUCycles;
+                  State.erase(Unit);
+                  VALUSALUStall = true;
+                } else {
+                  Delay.merge(It->second);
+                  State.erase(Unit);
+                }
               }
             }
           }
         }
+        unsigned maxCycles = 0;
+        unsigned lastWrite = 0;
+        if (Type != OTHER) {
+          for (const auto &Op : MI.defs()) {
+            for (MCRegUnit Unit : TRI->regunits(Op.getReg())) {
----------------
mihajlovicana wrote:

You mean a helper function for the double loop ?

https://github.com/llvm/llvm-project/pull/127212


More information about the llvm-commits mailing list