[llvm] [X86, CodeGen] Add a pattern in PreprocessISelDAG. (PR #85848)
via llvm-commits
llvm-commits at lists.llvm.org
Tue Mar 19 12:05:55 PDT 2024
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-backend-x86
Author: Peter Rong (DataCorrupted)
<details>
<summary>Changes</summary>
`%c = shl <X x i1> %a, %b -> %c = %a`
As discussed in #<!-- -->85681, this pattern is added to avoid cannot selection error. Since shift one is either identical or UB, we consider it as identical and replace all uses of %c with %a.
Tests for shl, ashr, lshr are added.
This fixes #<!-- -->85681.
---
Full diff: https://github.com/llvm/llvm-project/pull/85848.diff
2 Files Affected:
- (modified) llvm/lib/Target/X86/X86ISelDAGToDAG.cpp (+10-1)
- (added) llvm/test/CodeGen/X86/pr85681.ll (+39)
``````````diff
diff --git a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp
index 4e4241efd63d6b..824a86225b4dd6 100644
--- a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp
+++ b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp
@@ -1151,10 +1151,19 @@ void X86DAGToDAGISel::PreprocessISelDAG() {
case ISD::SHL:
case ISD::SRA:
case ISD::SRL: {
+ auto Ty = N->getValueType(0);
// Replace vector shifts with their X86 specific equivalent so we don't
// need 2 sets of patterns.
- if (!N->getValueType(0).isVector())
+ if (!Ty.isVector())
+ break;
+
+ // Per discussion in #85681, `%c = shl <X x i1> %a, %b -> %c = %a`,
+ // aka, replace all `%c` with `%a` and erase this instruction.
+ if (Ty.getVectorElementType().getFixedSizeInBits() == 1) {
+ CurDAG->ReplaceAllUsesOfValueWith(SDValue(N, 0), N->getOperand(0));
+ CurDAG->DeleteNode(N);
break;
+ }
unsigned NewOpc;
switch (N->getOpcode()) {
diff --git a/llvm/test/CodeGen/X86/pr85681.ll b/llvm/test/CodeGen/X86/pr85681.ll
new file mode 100644
index 00000000000000..8958d60cc561ea
--- /dev/null
+++ b/llvm/test/CodeGen/X86/pr85681.ll
@@ -0,0 +1,39 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=emeraldrapids | FileCheck %s
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=sapphirerapids | FileCheck %s
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=znver4 | FileCheck %s
+
+define i32 @shl(i32 %a0) {
+; CHECK-LABEL: shl:
+; CHECK: # %bb.0:
+; CHECK-NEXT: kxnord %k0, %k0, %k0
+; CHECK-NEXT: kmovd %k0, %eax
+; CHECK-NEXT: retq
+ %v0 = bitcast i32 %a0 to <32 x i1>
+ %s = shl <32 x i1> <i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true>, %v0
+ %r = bitcast <32 x i1> %s to i32
+ ret i32 %r
+}
+
+define i32 @lshr(i32 %a0) {
+; CHECK-LABEL: lshr:
+; CHECK: # %bb.0:
+; CHECK-NEXT: movl $-1, %eax
+; CHECK-NEXT: retq
+ %v0 = bitcast i32 %a0 to <32 x i1>
+ %s = lshr <32 x i1> <i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true>, %v0
+ %r = bitcast <32 x i1> %s to i32
+ ret i32 %r
+}
+
+
+define i32 @ashr(i32 %a0) {
+; CHECK-LABEL: ashr:
+; CHECK: # %bb.0:
+; CHECK-NEXT: movl $-1, %eax
+; CHECK-NEXT: retq
+ %v0 = bitcast i32 %a0 to <32 x i1>
+ %s = ashr <32 x i1> <i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true>, %v0
+ %r = bitcast <32 x i1> %s to i32
+ ret i32 %r
+}
``````````
</details>
https://github.com/llvm/llvm-project/pull/85848
More information about the llvm-commits
mailing list