[llvm] 5ad9adb - [Hexagon] Add missing patterns for boolean [v]selects

Krzysztof Parzyszek via llvm-commits llvm-commits at lists.llvm.org
Sat Jun 17 17:22:45 PDT 2023


Author: Krzysztof Parzyszek
Date: 2023-06-17T17:15:07-07:00
New Revision: 5ad9adb9b0ac1c788dee2e1d56850dc4a4d58f4e

URL: https://github.com/llvm/llvm-project/commit/5ad9adb9b0ac1c788dee2e1d56850dc4a4d58f4e
DIFF: https://github.com/llvm/llvm-project/commit/5ad9adb9b0ac1c788dee2e1d56850dc4a4d58f4e.diff

LOG: [Hexagon] Add missing patterns for boolean [v]selects

Fixes https://github.com/llvm/llvm-project/issues/59663

Added: 
    llvm/test/CodeGen/Hexagon/isel/select-i1.ll

Modified: 
    llvm/lib/Target/Hexagon/HexagonPatterns.td

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/Hexagon/HexagonPatterns.td b/llvm/lib/Target/Hexagon/HexagonPatterns.td
index 47cdf8759a166..d03c39d949ffc 100644
--- a/llvm/lib/Target/Hexagon/HexagonPatterns.td
+++ b/llvm/lib/Target/Hexagon/HexagonPatterns.td
@@ -978,10 +978,22 @@ def: Pat<(vselect (pnot V2I1:$Pu), V2I32:$Rs, V2I32:$Rt),
 
 
 // From LegalizeDAG.cpp: (Pu ? Pv : Pw) <=> (Pu & Pv) | (!Pu & Pw).
-def: Pat<(select I1:$Pu, I1:$Pv, I1:$Pw),
-         (C2_or (C2_and  I1:$Pu, I1:$Pv),
-                (C2_andn I1:$Pw, I1:$Pu))>;
-
+def: Pat<(select I1:$Pu, I1:$Ps, I1:$Pt),
+         (C4_or_andn (C2_and $Ps, $Pu), $Pt, $Pu)>;
+
+def: Pat<(vselect V2I1:$Pu, V2I1:$Ps, V2I1:$Pt),
+         (C4_or_andn (C2_and $Ps, $Pu), $Pt, $Pu)>;
+def: Pat<(vselect V4I1:$Pu, V4I1:$Ps, V4I1:$Pt),
+         (C4_or_andn (C2_and $Ps, $Pu), $Pt, $Pu)>;
+def: Pat<(vselect V8I1:$Pu, V8I1:$Ps, V8I1:$Pt),
+         (C4_or_andn (C2_and $Ps, $Pu), $Pt, $Pu)>;
+
+def: Pat<(select I1:$Pu, V2I1:$Ps, V2I1:$Pt),
+         (C2_tfrrp (C2_mux $Pu, (C2_tfrpr $Ps), (C2_tfrpr $Pt)))>;
+def: Pat<(select I1:$Pu, V4I1:$Ps, V4I1:$Pt),
+         (C2_tfrrp (C2_mux $Pu, (C2_tfrpr $Ps), (C2_tfrpr $Pt)))>;
+def: Pat<(select I1:$Pu, V8I1:$Ps, V8I1:$Pt),
+         (C2_tfrrp (C2_mux $Pu, (C2_tfrpr $Ps), (C2_tfrpr $Pt)))>;
 
 def IsPosHalf : PatLeaf<(i32 IntRegs:$a), [{
   return isPositiveHalfWord(N);

diff  --git a/llvm/test/CodeGen/Hexagon/isel/select-i1.ll b/llvm/test/CodeGen/Hexagon/isel/select-i1.ll
new file mode 100644
index 0000000000000..d480b7a168361
--- /dev/null
+++ b/llvm/test/CodeGen/Hexagon/isel/select-i1.ll
@@ -0,0 +1,224 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
+; RUN: llc -march=hexagon < %s | FileCheck %s
+
+define void @f0(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f0:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = mux(p0,r1,r2)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = mux(p0,#1,#0)
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     memb(r3+#0) = r0.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load i1, ptr %a0
+  %v1 = load i1, ptr %a1
+  %v2 = load i1, ptr %a2
+  %v3 = select i1 %v0, i1 %v1, i1 %v2
+  store i1 %v3, ptr %a3
+  ret void
+}
+
+define void @f1(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f1:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = mux(p0,r1,r2)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:     memb(r3+#0) = r0.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load i1, ptr %a0
+  %v1 = load <2 x i1>, ptr %a1
+  %v2 = load <2 x i1>, ptr %a2
+  %v3 = select i1 %v0, <2 x i1> %v1, <2 x i1> %v2
+  store <2 x i1> %v3, ptr %a3
+  ret void
+}
+
+define void @f2(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f2:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = mux(p0,r1,r2)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:     memb(r3+#0) = r0.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load i1, ptr %a0
+  %v1 = load <4 x i1>, ptr %a1
+  %v2 = load <4 x i1>, ptr %a2
+  %v3 = select i1 %v0, <4 x i1> %v1, <4 x i1> %v2
+  store <4 x i1> %v3, ptr %a3
+  ret void
+}
+
+define void @f3(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f3:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r0 = mux(p0,r1,r2)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:     memb(r3+#0) = r0.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load i1, ptr %a0
+  %v1 = load <8 x i1>, ptr %a1
+  %v2 = load <8 x i1>, ptr %a2
+  %v3 = select i1 %v0, <8 x i1> %v1, <8 x i1> %v2
+  store <8 x i1> %v3, ptr %a3
+  ret void
+}
+
+define void @f4(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f4:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r1 = memub(r1+#0)
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = memub(r2+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:     p1 = r1
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p2 = r2
+; CHECK-NEXT:     p1 = and(p1,p0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = or(p1,and(p2,!p0))
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = p0
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     memb(r3+#0) = r2.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load <2 x i1>, ptr %a0
+  %v1 = load <2 x i1>, ptr %a1
+  %v2 = load <2 x i1>, ptr %a2
+  %v3 = select <2 x i1> %v0, <2 x i1> %v1, <2 x i1> %v2
+  store <2 x i1> %v3, ptr %a3
+  ret void
+}
+
+define void @f5(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f5:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r1 = memub(r1+#0)
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = memub(r2+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:     p1 = r1
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p2 = r2
+; CHECK-NEXT:     p1 = and(p1,p0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = or(p1,and(p2,!p0))
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = p0
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     memb(r3+#0) = r2.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load <4 x i1>, ptr %a0
+  %v1 = load <4 x i1>, ptr %a1
+  %v2 = load <4 x i1>, ptr %a2
+  %v3 = select <4 x i1> %v0, <4 x i1> %v1, <4 x i1> %v2
+  store <4 x i1> %v3, ptr %a3
+  ret void
+}
+
+define void @f6(ptr %a0, ptr %a1, ptr %a2, ptr %a3) {
+; CHECK-LABEL: f6:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  // %bb.0: // %b0
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r1 = memub(r1+#0)
+; CHECK-NEXT:     r0 = memub(r0+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = memub(r2+#0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = r0
+; CHECK-NEXT:     p1 = r1
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p2 = r2
+; CHECK-NEXT:     p1 = and(p1,p0)
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     p0 = or(p1,and(p2,!p0))
+; CHECK-NEXT:    }
+; CHECK-NEXT:    {
+; CHECK-NEXT:     r2 = p0
+; CHECK-NEXT:     jumpr r31
+; CHECK-NEXT:     memb(r3+#0) = r2.new
+; CHECK-NEXT:    }
+b0:
+  %v0 = load <8 x i1>, ptr %a0
+  %v1 = load <8 x i1>, ptr %a1
+  %v2 = load <8 x i1>, ptr %a2
+  %v3 = select <8 x i1> %v0, <8 x i1> %v1, <8 x i1> %v2
+  store <8 x i1> %v3, ptr %a3
+  ret void
+}


        


More information about the llvm-commits mailing list