[Mlir-commits] [mlir] [mlir][memref] Support folding memref.load from global splat constants (PR #176627)
llvmlistbot at llvm.org
llvmlistbot at llvm.org
Sat Jan 17 22:07:16 PST 2026
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-mlir
Author: Longsheng Mou (CoTinker)
<details>
<summary>Changes</summary>
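This change extends the `memref.load` folder so that a load from a `memref.get_global` whose `memref.global` is constant and initialized with a splat value folds to that splat value. Because every element of a splat is identical, the fold is valid irrespective of the load indices.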
---
Full diff: https://github.com/llvm/llvm-project/pull/176627.diff
2 Files Affected:
- (modified) mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp (+20)
- (modified) mlir/test/Dialect/MemRef/canonicalize.mlir (+19)
``````````diff
diff --git a/mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp b/mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp
index e0f7a8b452a1d..b15b2a3e24b95 100644
--- a/mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp
+++ b/mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp
@@ -1705,6 +1705,26 @@ OpFoldResult LoadOp::fold(FoldAdaptor adaptor) {
/// load(memrefcast) -> load
if (succeeded(foldMemRefCast(*this)))
return getResult();
+
+ // Fold load from a global constant memref.
+ auto getGlobalOp = getMemref().getDefiningOp<memref::GetGlobalOp>();
+ if (!getGlobalOp)
+ return {};
+
+ // Get to the memref.global defining the symbol.
+ auto global = SymbolTable::lookupNearestSymbolFrom<memref::GlobalOp>(
+ getGlobalOp, getGlobalOp.getNameAttr());
+ if (!global)
+ return {};
+ // Check if the global memref is a constant.
+ auto cstAttr =
+ dyn_cast_or_null<DenseElementsAttr>(global.getConstantInitValue());
+ if (!cstAttr)
+ return {};
+ // If it's a splat constant, we can fold irrespective of indices.
+ if (auto splatAttr = dyn_cast<SplatElementsAttr>(cstAttr))
+ return splatAttr.getSplatValue<Attribute>();
+
return OpFoldResult();
}
diff --git a/mlir/test/Dialect/MemRef/canonicalize.mlir b/mlir/test/Dialect/MemRef/canonicalize.mlir
index 122906037b952..a3af67076a1d2 100644
--- a/mlir/test/Dialect/MemRef/canonicalize.mlir
+++ b/mlir/test/Dialect/MemRef/canonicalize.mlir
@@ -1416,6 +1416,25 @@ func.func @load_store_nontemporal(%input : memref<32xf32, affine_map<(d0) -> (d0
// -----
+memref.global "private" constant @__constant_32xf32 : memref<32xf32> = dense<1.000000e+00>
+// CHECK-LABEL: func @fold_const_splat_global
+func.func @fold_const_splat_global() -> memref<32xf32> {
+ // CHECK-NEXT: %[[CST:.*]] = arith.constant 1.000000e+00 : f32
+ %0 = memref.get_global @__constant_32xf32 : memref<32xf32>
+ %alloc = memref.alloc() : memref<32xf32>
+ %c32 = arith.constant 32 : index
+ %c0 = arith.constant 0 : index
+ %c1 = arith.constant 1 : index
+ scf.for %arg0 = %c0 to %c32 step %c1 {
+ %1 = memref.load %0[%arg0] : memref<32xf32>
+ // CHECK: memref.store %[[CST]], %{{.*}}
+ memref.store %1, %alloc[%arg0] : memref<32xf32>
+ }
+ return %alloc : memref<32xf32>
+}
+
+// -----
+
// CHECK-LABEL: func @fold_trivial_memory_space_cast(
// CHECK-SAME: %[[arg:.*]]: memref<?xf32>
// CHECK: return %[[arg]]
``````````
</details>
https://github.com/llvm/llvm-project/pull/176627
More information about the Mlir-commits mailing list