[llvm] [CodeGenPrepare] Drop nsw flags in `optimizeLoadExt` (PR #118180)
via llvm-commits
llvm-commits at lists.llvm.org
Sat Nov 30 08:59:09 PST 2024
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-llvm-transforms
Author: Yingwei Zheng (dtcxzyw)
<details>
<summary>Changes</summary>
Alive2: https://alive2.llvm.org/ce/z/pMcD7q
Closes https://github.com/llvm/llvm-project/issues/118172.
---
Full diff: https://github.com/llvm/llvm-project/pull/118180.diff
2 Files Affected:
- (modified) llvm/lib/CodeGen/CodeGenPrepare.cpp (+7)
- (added) llvm/test/Transforms/CodeGenPrepare/X86/pr118172.ll (+86)
``````````diff
diff --git a/llvm/lib/CodeGen/CodeGenPrepare.cpp b/llvm/lib/CodeGen/CodeGenPrepare.cpp
index ead8aa6d220973..83c6ecd401039f 100644
--- a/llvm/lib/CodeGen/CodeGenPrepare.cpp
+++ b/llvm/lib/CodeGen/CodeGenPrepare.cpp
@@ -7138,6 +7138,7 @@ bool CodeGenPrepare::optimizeLoadExt(LoadInst *Load) {
SmallVector<Instruction *, 8> WorkList;
SmallPtrSet<Instruction *, 16> Visited;
SmallVector<Instruction *, 8> AndsToMaybeRemove;
+ SmallVector<Instruction *, 8> DropFlags;
for (auto *U : Load->users())
WorkList.push_back(cast<Instruction>(U));
@@ -7185,6 +7186,7 @@ bool CodeGenPrepare::optimizeLoadExt(LoadInst *Load) {
return false;
uint64_t ShiftAmt = ShlC->getLimitedValue(BitWidth - 1);
DemandBits.setLowBits(BitWidth - ShiftAmt);
+ DropFlags.push_back(I);
break;
}
@@ -7192,6 +7194,7 @@ bool CodeGenPrepare::optimizeLoadExt(LoadInst *Load) {
EVT TruncVT = TLI->getValueType(*DL, I->getType());
unsigned TruncBitWidth = TruncVT.getSizeInBits();
DemandBits.setLowBits(TruncBitWidth);
+ DropFlags.push_back(I);
break;
}
@@ -7249,6 +7252,10 @@ bool CodeGenPrepare::optimizeLoadExt(LoadInst *Load) {
++NumAndUses;
}
+ // NSW flags may no longer hold.
+ for (auto *Inst : DropFlags)
+ Inst->setHasNoSignedWrap(false);
+
++NumAndsAdded;
return true;
}
diff --git a/llvm/test/Transforms/CodeGenPrepare/X86/pr118172.ll b/llvm/test/Transforms/CodeGenPrepare/X86/pr118172.ll
new file mode 100644
index 00000000000000..a599129466b35c
--- /dev/null
+++ b/llvm/test/Transforms/CodeGenPrepare/X86/pr118172.ll
@@ -0,0 +1,86 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
+; RUN: opt -S -passes='require<profile-summary>,function(codegenprepare)' -mtriple=x86_64-unknown-unknown < %s | FileCheck %s
+
+; Make sure the nsw flag is dropped when the load ext is combined.
+define i32 @simplify_load_ext_drop_trunc_nsw(ptr %p) {
+; CHECK-LABEL: define i32 @simplify_load_ext_drop_trunc_nsw(
+; CHECK-SAME: ptr [[P:%.*]]) {
+; CHECK-NEXT: [[ENTRY:.*:]]
+; CHECK-NEXT: [[X:%.*]] = load i32, ptr [[P]], align 4
+; CHECK-NEXT: [[TMP0:%.*]] = and i32 [[X]], 255
+; CHECK-NEXT: [[TRUNC:%.*]] = trunc i32 [[TMP0]] to i8
+; CHECK-NEXT: [[EXT1:%.*]] = sext i8 [[TRUNC]] to i16
+; CHECK-NEXT: call void @use(i32 [[TMP0]])
+; CHECK-NEXT: [[EXT2:%.*]] = zext i16 [[EXT1]] to i32
+; CHECK-NEXT: ret i32 [[EXT2]]
+;
+entry:
+ %x = load i32, ptr %p, align 4
+ %trunc = trunc nsw i32 %x to i8
+ %ext1 = sext i8 %trunc to i16
+ %conv2 = and i32 %x, 255
+ call void @use(i32 %conv2)
+ %ext2 = zext i16 %ext1 to i32
+ ret i32 %ext2
+}
+
+; Make sure the nsw flag is dropped when the load ext is combined.
+define i32 @simplify_load_ext_drop_shl_nsw(ptr %p) {
+; CHECK-LABEL: define i32 @simplify_load_ext_drop_shl_nsw(
+; CHECK-SAME: ptr [[P:%.*]]) {
+; CHECK-NEXT: [[ENTRY:.*:]]
+; CHECK-NEXT: [[X:%.*]] = load i32, ptr [[P]], align 4
+; CHECK-NEXT: [[TMP0:%.*]] = and i32 [[X]], 255
+; CHECK-NEXT: [[SHL:%.*]] = shl i32 [[TMP0]], 24
+; CHECK-NEXT: call void @use(i32 [[TMP0]])
+; CHECK-NEXT: ret i32 [[SHL]]
+;
+entry:
+ %x = load i32, ptr %p, align 4
+ %shl = shl nsw i32 %x, 24
+ %conv2 = and i32 %x, 255
+ call void @use(i32 %conv2)
+ ret i32 %shl
+}
+
+define i32 @simplify_load_ext_keep_trunc_nuw(ptr %p) {
+; CHECK-LABEL: define i32 @simplify_load_ext_keep_trunc_nuw(
+; CHECK-SAME: ptr [[P:%.*]]) {
+; CHECK-NEXT: [[ENTRY:.*:]]
+; CHECK-NEXT: [[X:%.*]] = load i32, ptr [[P]], align 4
+; CHECK-NEXT: [[TMP0:%.*]] = and i32 [[X]], 255
+; CHECK-NEXT: [[TRUNC:%.*]] = trunc nuw i32 [[TMP0]] to i8
+; CHECK-NEXT: [[EXT1:%.*]] = sext i8 [[TRUNC]] to i16
+; CHECK-NEXT: call void @use(i32 [[TMP0]])
+; CHECK-NEXT: [[EXT2:%.*]] = zext i16 [[EXT1]] to i32
+; CHECK-NEXT: ret i32 [[EXT2]]
+;
+entry:
+ %x = load i32, ptr %p, align 4
+ %trunc = trunc nuw i32 %x to i8
+ %ext1 = sext i8 %trunc to i16
+ %conv2 = and i32 %x, 255
+ call void @use(i32 %conv2)
+ %ext2 = zext i16 %ext1 to i32
+ ret i32 %ext2
+}
+
+define i32 @simplify_load_ext_drop_shl_nuw(ptr %p) {
+; CHECK-LABEL: define i32 @simplify_load_ext_drop_shl_nuw(
+; CHECK-SAME: ptr [[P:%.*]]) {
+; CHECK-NEXT: [[ENTRY:.*:]]
+; CHECK-NEXT: [[X:%.*]] = load i32, ptr [[P]], align 4
+; CHECK-NEXT: [[TMP0:%.*]] = and i32 [[X]], 255
+; CHECK-NEXT: [[SHL:%.*]] = shl nuw i32 [[TMP0]], 24
+; CHECK-NEXT: call void @use(i32 [[TMP0]])
+; CHECK-NEXT: ret i32 [[SHL]]
+;
+entry:
+ %x = load i32, ptr %p, align 4
+ %shl = shl nuw i32 %x, 24
+ %conv2 = and i32 %x, 255
+ call void @use(i32 %conv2)
+ ret i32 %shl
+}
+
+declare void @use(i32)
``````````
</details>
https://github.com/llvm/llvm-project/pull/118180
More information about the llvm-commits mailing list