[llvm] [LLVM][NVPTX] Enable family specific support for a few intrinsics (PR #173268)

Pradeep Kumar via llvm-commits llvm-commits at lists.llvm.org
Tue Dec 23 00:02:44 PST 2025


================
@@ -165,8 +143,32 @@ class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
   }
 
   bool hasTcgen05MMAScaleInputDImm() const {
-    return FullSmVersion == 1003 && PTXVersion >= 86;
+    return hasPTXWithFamilySMs(88, {100}) || hasPTXWithAccelSMs(86, {100});
+  }
+
+  bool hasTcgen05MMAI8Kind() const {
+    return hasPTXWithAccelSMs(86, {100, 101}) ||
+           hasPTXWithAccelSMs(90, {100, 110});
+  }
+
+  bool hasTcgen05MMASparseMxf4nvf4() const {
+    return hasPTXWithAccelSMs(87, {100, 101, 103}) ||
+           hasPTXWithAccelSMs(90, {100, 110, 103});
+  }
+
+  bool hasTcgen05MMASparseMxf4() const {
+    return hasPTXWithAccelSMs(86, {100, 101, 103}) ||
+           hasPTXWithAccelSMs(90, {100, 110, 103});
+  }
+
+  bool hasReduxSyncF32() const {
+    return hasPTXWithFamilySMs(88, {100}) || hasPTXWithAccelSMs(86, {100});
+  }
+
+  bool hasSparseMmaWithBlockScaleF4() const {
----------------
schwarzschild-radius wrote:

Renamed the function from `hasSparseMmaWithBlockScaleF4` to `hasMMASparseBlockScaleF4`.

https://github.com/llvm/llvm-project/pull/173268


More information about the llvm-commits mailing list