[llvm] [MemCpyOpt] Avoid infinite loops in `MemCpyOptPass::processMemCpyMemCpyDependence` (PR #103218)

Yingwei Zheng via llvm-commits llvm-commits at lists.llvm.org
Thu Aug 22 00:48:00 PDT 2024


https://github.com/dtcxzyw updated https://github.com/llvm/llvm-project/pull/103218

>From 7bc99d38c051c67517696aef2644725e140a57f0 Mon Sep 17 00:00:00 2001
From: Yingwei Zheng <dtcxzyw2333 at gmail.com>
Date: Tue, 13 Aug 2024 22:36:00 +0800
Subject: [PATCH 1/2] [MemCpyOpt] Avoid infinite loops in
 `MemCpyOptPass::processMemCpyMemCpyDependence`

---
 llvm/lib/Transforms/Scalar/MemCpyOptimizer.cpp |  4 ++++
 llvm/test/Transforms/MemCpyOpt/pr102994.ll     | 18 ++++++++++++++++++
 2 files changed, 22 insertions(+)
 create mode 100644 llvm/test/Transforms/MemCpyOpt/pr102994.ll

diff --git a/llvm/lib/Transforms/Scalar/MemCpyOptimizer.cpp b/llvm/lib/Transforms/Scalar/MemCpyOptimizer.cpp
index 1d779128e454c1..3f15fa2163d270 100644
--- a/llvm/lib/Transforms/Scalar/MemCpyOptimizer.cpp
+++ b/llvm/lib/Transforms/Scalar/MemCpyOptimizer.cpp
@@ -1193,6 +1193,10 @@ bool MemCpyOptPass::processMemCpyMemCpyDependence(MemCpyInst *M,
       CopySourceAlign = commonAlignment(*CopySourceAlign, MForwardOffset);
   }
 
+  // Avoid infinite loops
+  if (BAA.isMustAlias(M->getSource(), CopySource))
+    return false;
+
   // Verify that the copied-from memory doesn't change in between the two
   // transfers.  For example, in:
   //    memcpy(a <- b)
diff --git a/llvm/test/Transforms/MemCpyOpt/pr102994.ll b/llvm/test/Transforms/MemCpyOpt/pr102994.ll
new file mode 100644
index 00000000000000..53d6335f6e9d0b
--- /dev/null
+++ b/llvm/test/Transforms/MemCpyOpt/pr102994.ll
@@ -0,0 +1,18 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
+; RUN: opt -S -passes=memcpyopt < %s | FileCheck %s
+
+@g1 = external global i8
+@g2 = external global [64 x i8]
+
+define void @func() {
+; CHECK-LABEL: define void @func() {
+; CHECK-NEXT:  [[ENTRY:.*:]]
+; CHECK-NEXT:    call void @llvm.memcpy.p0.p0.i64(ptr getelementptr inbounds (i8, ptr @g2, i64 16), ptr getelementptr inbounds nuw (i8, ptr @g2, i64 16), i64 20, i1 false)
+; CHECK-NEXT:    call void @llvm.memcpy.p0.p0.i64(ptr @g1, ptr getelementptr inbounds (i8, ptr @g2, i64 24), i64 1, i1 false)
+; CHECK-NEXT:    ret void
+;
+entry:
+  call void @llvm.memcpy.p0.p0.i64(ptr getelementptr inbounds (i8, ptr @g2, i64 16), ptr getelementptr inbounds nuw (i8, ptr @g2, i64 16), i64 20, i1 false)
+  call void @llvm.memcpy.p0.p0.i64(ptr @g1, ptr getelementptr inbounds (i8, ptr @g2, i64 24), i64 1, i1 false)
+  ret void
+}

>From bd8d6dd19ca3f424751875d3d026749d6d935bd6 Mon Sep 17 00:00:00 2001
From: Yingwei Zheng <dtcxzyw2333 at gmail.com>
Date: Thu, 22 Aug 2024 15:47:09 +0800
Subject: [PATCH 2/2] [MemCpyOpt] Add new tests without constantexpr

---
 llvm/test/Transforms/MemCpyOpt/pr102994.ll | 21 +++++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/llvm/test/Transforms/MemCpyOpt/pr102994.ll b/llvm/test/Transforms/MemCpyOpt/pr102994.ll
index 53d6335f6e9d0b..9a782b9b3752a2 100644
--- a/llvm/test/Transforms/MemCpyOpt/pr102994.ll
+++ b/llvm/test/Transforms/MemCpyOpt/pr102994.ll
@@ -3,6 +3,7 @@
 
 @g1 = external global i8
 @g2 = external global [64 x i8]
+@g3 = global i8 0, align 1
 
 define void @func() {
 ; CHECK-LABEL: define void @func() {
@@ -16,3 +17,23 @@ entry:
   call void @llvm.memcpy.p0.p0.i64(ptr @g1, ptr getelementptr inbounds (i8, ptr @g2, i64 24), i64 1, i1 false)
   ret void
 }
+
+define void @func2(ptr %p) {
+; CHECK-LABEL: define void @func2(
+; CHECK-SAME: ptr [[P:%.*]]) {
+; CHECK-NEXT:  [[ENTRY:.*:]]
+; CHECK-NEXT:    [[GEP1:%.*]] = getelementptr i8, ptr [[P]], i64 32
+; CHECK-NEXT:    [[GEP2:%.*]] = getelementptr i8, ptr [[P]], i64 34
+; CHECK-NEXT:    [[GEP3:%.*]] = getelementptr i8, ptr [[P]], i64 32
+; CHECK-NEXT:    call void @llvm.memcpy.p0.p0.i64(ptr [[GEP1]], ptr [[GEP3]], i64 32, i1 false)
+; CHECK-NEXT:    call void @llvm.memcpy.p0.p0.i64(ptr @g3, ptr [[GEP2]], i64 1, i1 false)
+; CHECK-NEXT:    ret void
+;
+entry:
+  %gep1 = getelementptr i8, ptr %p, i64 32
+  %gep2 = getelementptr i8, ptr %p, i64 34
+  %gep3 = getelementptr i8, ptr %p, i64 32
+  call void @llvm.memcpy.p0.p0.i64(ptr %gep1, ptr %gep3, i64 32, i1 false)
+  call void @llvm.memcpy.p0.p0.i64(ptr @g3, ptr %gep2, i64 1, i1 false)
+  ret void
+}



More information about the llvm-commits mailing list