[llvm] d679dc7 - [Hexagon]Handle truncate of v4i8/v2i16 -> v4i1/v2i1 when Hvx is enabled (#147476)

via llvm-commits llvm-commits at lists.llvm.org
Fri Jul 11 01:27:12 PDT 2025


Author: pkarveti
Date: 2025-07-11T01:27:07-07:00
New Revision: d679dc78229ccc9060374b58c1fa911e2c4a1335

URL: https://github.com/llvm/llvm-project/commit/d679dc78229ccc9060374b58c1fa911e2c4a1335
DIFF: https://github.com/llvm/llvm-project/commit/d679dc78229ccc9060374b58c1fa911e2c4a1335.diff

LOG: [Hexagon]Handle truncate of v4i8/v2i16 -> v4i1/v2i1 when Hvx is enabled (#147476)

Added: 
    

Modified: 
    llvm/lib/Target/Hexagon/HexagonPatterns.td
    llvm/test/CodeGen/Hexagon/isel/trunc-vNi1.ll

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/Hexagon/HexagonPatterns.td b/llvm/lib/Target/Hexagon/HexagonPatterns.td
index 2a991bafbf148..4d15cfa651270 100644
--- a/llvm/lib/Target/Hexagon/HexagonPatterns.td
+++ b/llvm/lib/Target/Hexagon/HexagonPatterns.td
@@ -582,6 +582,13 @@ def: Pat<(v8i1 (trunc V8I8:$Rs)),
          (A4_vcmpbeqi (Combinew (A2_andir (HiReg $Rs), (i32 0x01010101)),
                                 (A2_andir (LoReg $Rs), (i32 0x01010101))),
                       (i32 1))>;
+def : Pat<(v4i1 (trunc V4I8:$Rs)),
+          (A4_vcmpheqi (Combinew (A2_andir (HiReg (S2_vzxtbh $Rs)), 0x00010001),
+                                 (A2_andir (LoReg (S2_vzxtbh $Rs)), 0x00010001)),
+                       (i32 1))>;
+def: Pat<(v2i1 (trunc V2I16:$Rs)),
+          (A4_vcmpweqi (A2_andp (S2_vzxthw $Rs), (A2_combineii (i32 1), (i32 1))),
+                      (i32 1))>;
 
 
 // Saturation:

diff  --git a/llvm/test/CodeGen/Hexagon/isel/trunc-vNi1.ll b/llvm/test/CodeGen/Hexagon/isel/trunc-vNi1.ll
index 1090b64fcad52..c91f16d91d1be 100644
--- a/llvm/test/CodeGen/Hexagon/isel/trunc-vNi1.ll
+++ b/llvm/test/CodeGen/Hexagon/isel/trunc-vNi1.ll
@@ -1,24 +1,11 @@
-; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
 ; RUN: llc -mtriple=hexagon < %s | FileCheck %s
+; RUN: llc --mtriple=hexagon -mattr=+hvxv79,+hvx-length128b < %s | FileCheck %s
 
 define void @f0(<2 x i32> %a0, ptr %a1) {
 ; CHECK-LABEL: f0:
-; CHECK:         .cfi_startproc
-; CHECK-NEXT:  // %bb.0: // %b0
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r5:4 = combine(#1,#1)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r1:0 = and(r1:0,r5:4)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     p0 = vcmpw.eq(r1:0,#1)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r0 = p0
-; CHECK-NEXT:     jumpr r31
-; CHECK-NEXT:     memb(r2+#0) = r0.new
-; CHECK-NEXT:    }
+; CHECK: r[[REG1H:([0-9]+)]]:[[REG1L:([0-9]+)]] = combine(#1,#1)
+; CHECK: r[[REG2H:([0-9]+)]]:[[REG2L:([0-9]+)]] = and(r[[REG2H]]:[[REG2L]],r[[REG1H]]:[[REG1L]])
+; CHECK: p{{[0-9]+}} = vcmpw.eq(r[[REG2H]]:[[REG2L]],#1)
 b0:
   %v0 = trunc <2 x i32> %a0 to <2 x i1>
   store <2 x i1> %v0, ptr %a1, align 1
@@ -27,20 +14,9 @@ b0:
 
 define void @f1(<4 x i16> %a0, ptr %a1) {
 ; CHECK-LABEL: f1:
-; CHECK:         .cfi_startproc
-; CHECK-NEXT:  // %bb.0: // %b0
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r0 = and(r0,##65537)
-; CHECK-NEXT:     r1 = and(r1,##65537)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     p0 = vcmph.eq(r1:0,#1)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r0 = p0
-; CHECK-NEXT:     jumpr r31
-; CHECK-NEXT:     memb(r2+#0) = r0.new
-; CHECK-NEXT:    }
+; CHECK: [[REG0:r([0-9]+)]] = and([[REG0]],##65537)
+; CHECK: [[REG1:r([0-9]+)]] = and([[REG1]],##65537)
+; CHECK: p{{[0-9]+}} = vcmph.eq(r{{[0-9]+}}:{{[0-9]+}},#1)
 b0:
   %v0 = trunc <4 x i16> %a0 to <4 x i1>
   store <4 x i1> %v0, ptr %a1, align 1
@@ -49,22 +25,35 @@ b0:
 
 define void @f2(<8 x i8> %a0, ptr %a1) {
 ; CHECK-LABEL: f2:
-; CHECK:         .cfi_startproc
-; CHECK-NEXT:  // %bb.0: // %b0
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r0 = and(r0,##16843009)
-; CHECK-NEXT:     r1 = and(r1,##16843009)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     p0 = vcmpb.eq(r1:0,#1)
-; CHECK-NEXT:    }
-; CHECK-NEXT:    {
-; CHECK-NEXT:     r0 = p0
-; CHECK-NEXT:     jumpr r31
-; CHECK-NEXT:     memb(r2+#0) = r0.new
-; CHECK-NEXT:    }
+; CHECK: [[REG0:r([0-9]+)]] = and([[REG0]],##16843009)
+; CHECK: [[REG1:r([0-9]+)]] = and([[REG1]],##16843009)
+; CHECK: p{{[0-9]+}} = vcmpb.eq(r{{[0-9]+}}:{{[0-9]+}},#1)
 b0:
   %v0 = trunc <8 x i8> %a0 to <8 x i1>
   store <8 x i1> %v0, ptr %a1, align 1
   ret void
 }
+
+define void @f3(<4 x i8> %a0, ptr %a1) {
+; CHECK-LABEL: f3:
+; CHECK: r[[REGH:([0-9]+)]]:[[REGL:([0-9]+)]] = vzxtbh(r{{[0-9]+}})
+; CHECK: r[[REGL]] = and(r[[REGL]],##65537)
+; CHECK: r[[REGH]] = and(r[[REGH]],##65537)
+; CHECK: p{{[0-9]+}} = vcmph.eq(r[[REGH]]:[[REGL]],#1)
+b0:
+  %v0 = trunc <4 x i8> %a0 to <4 x i1>
+  store <4 x i1> %v0, ptr %a1, align 1
+  ret void
+}
+
+define void @f4(<2 x i16> %a0, ptr %a1) {
+; CHECK-LABEL: f4:
+; CHECK: r[[REGH:([0-9]+)]]:[[REGL:([0-9]+)]] = vzxthw(r{{[0-9]+}})
+; CHECK: r[[REG1H:([0-9]+)]]:[[REG1L:([0-9]+)]] = combine(#1,#1)
+; CHECK: r[[REGH]]:[[REGL]] = and(r[[REGH]]:[[REGL]],r[[REG1H]]:[[REG1L]])
+; CHECK: p{{[0-9]+}} = vcmpw.eq(r[[REGH]]:[[REGL]],#1)
+b0:
+  %v0 = trunc <2 x i16> %a0 to <2 x i1>
+  store <2 x i1> %v0, ptr %a1, align 1
+  ret void
+}


        


More information about the llvm-commits mailing list