[llvm] [RISCV] Add short forward branch support for `min`, `max`, `maxu` and `minu` (PR #164394)

via llvm-commits llvm-commits at lists.llvm.org
Tue Oct 21 03:47:37 PDT 2025


https://github.com/hchandel created https://github.com/llvm/llvm-project/pull/164394

None

>From c1cb8b072a2e0051bd15868f0817c95d028d5077 Mon Sep 17 00:00:00 2001
From: Harsh Chandel <hchandel at qti.qualcomm.com>
Date: Thu, 16 Oct 2025 14:24:55 +0530
Subject: [PATCH 1/2] [RISCV] Add short forward branch support for max

Change-Id: I7585f98422bf4b101fd44b1b4d6bc8584ca8cb53
---
 llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp | 2 ++
 llvm/lib/Target/RISCV/RISCVInstrInfo.cpp         | 1 +
 llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td       | 1 +
 3 files changed, 4 insertions(+)

diff --git a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
index 410561855e181..ff96ed9a6b5d0 100644
--- a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
+++ b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
@@ -127,6 +127,7 @@ bool RISCVExpandPseudo::expandMI(MachineBasicBlock &MBB,
   case RISCV::PseudoCCAND:
   case RISCV::PseudoCCOR:
   case RISCV::PseudoCCXOR:
+  case RISCV::PseudoCCMAX:
   case RISCV::PseudoCCADDW:
   case RISCV::PseudoCCSUBW:
   case RISCV::PseudoCCSLL:
@@ -228,6 +229,7 @@ bool RISCVExpandPseudo::expandCCOp(MachineBasicBlock &MBB,
     case RISCV::PseudoCCAND:   NewOpc = RISCV::AND;   break;
     case RISCV::PseudoCCOR:    NewOpc = RISCV::OR;    break;
     case RISCV::PseudoCCXOR:   NewOpc = RISCV::XOR;   break;
+    case RISCV::PseudoCCMAX:   NewOpc = RISCV::MAX;   break;
     case RISCV::PseudoCCADDI:  NewOpc = RISCV::ADDI;  break;
     case RISCV::PseudoCCSLLI:  NewOpc = RISCV::SLLI;  break;
     case RISCV::PseudoCCSRLI:  NewOpc = RISCV::SRLI;  break;
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp b/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
index 96e1078467f19..c27a96305f1c0 100644
--- a/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
@@ -1698,6 +1698,7 @@ unsigned getPredicatedOpcode(unsigned Opcode) {
   case RISCV::AND:   return RISCV::PseudoCCAND;   break;
   case RISCV::OR:    return RISCV::PseudoCCOR;    break;
   case RISCV::XOR:   return RISCV::PseudoCCXOR;   break;
+  case RISCV::MAX:   return RISCV::PseudoCCMAX;   break;
 
   case RISCV::ADDI:  return RISCV::PseudoCCADDI;  break;
   case RISCV::SLLI:  return RISCV::PseudoCCSLLI;  break;
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td b/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
index 0114fbdc56302..5ca145d6c458c 100644
--- a/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
@@ -106,6 +106,7 @@ def PseudoCCSRA : SFBALU_rr;
 def PseudoCCAND : SFBALU_rr;
 def PseudoCCOR  : SFBALU_rr;
 def PseudoCCXOR : SFBALU_rr;
+def PseudoCCMAX : SFBALU_rr;
 
 def PseudoCCADDI : SFBALU_ri;
 def PseudoCCANDI : SFBALU_ri;

>From a28faada306dac91eb7aff718e19b8fc89c6b1ba Mon Sep 17 00:00:00 2001
From: Harsh Chandel <hchandel at qti.qualcomm.com>
Date: Tue, 21 Oct 2025 11:44:07 +0530
Subject: [PATCH 2/2] [RISCV] Add short forward branch support for min, maxu and minu

Change-Id: I5a2deafae906b518f3379b2c4ba625cf0a76df79
---
 .../Target/RISCV/RISCVExpandPseudoInsts.cpp   |   6 +
 llvm/lib/Target/RISCV/RISCVInstrInfo.cpp      |   3 +
 llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td    |   3 +
 .../RISCV/short-forward-branch-opt-min-max.ll | 539 ++++++++++++++++++
 4 files changed, 551 insertions(+)
 create mode 100644 llvm/test/CodeGen/RISCV/short-forward-branch-opt-min-max.ll

diff --git a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
index ff96ed9a6b5d0..567a8da50a1db 100644
--- a/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
+++ b/llvm/lib/Target/RISCV/RISCVExpandPseudoInsts.cpp
@@ -128,6 +128,9 @@ bool RISCVExpandPseudo::expandMI(MachineBasicBlock &MBB,
   case RISCV::PseudoCCOR:
   case RISCV::PseudoCCXOR:
   case RISCV::PseudoCCMAX:
+  case RISCV::PseudoCCMAXU:
+  case RISCV::PseudoCCMIN:
+  case RISCV::PseudoCCMINU:
   case RISCV::PseudoCCADDW:
   case RISCV::PseudoCCSUBW:
   case RISCV::PseudoCCSLL:
@@ -230,6 +233,9 @@ bool RISCVExpandPseudo::expandCCOp(MachineBasicBlock &MBB,
     case RISCV::PseudoCCOR:    NewOpc = RISCV::OR;    break;
     case RISCV::PseudoCCXOR:   NewOpc = RISCV::XOR;   break;
     case RISCV::PseudoCCMAX:   NewOpc = RISCV::MAX;   break;
+    case RISCV::PseudoCCMIN:   NewOpc = RISCV::MIN;   break;
+    case RISCV::PseudoCCMAXU:  NewOpc = RISCV::MAXU;  break;
+    case RISCV::PseudoCCMINU:  NewOpc = RISCV::MINU;  break;
     case RISCV::PseudoCCADDI:  NewOpc = RISCV::ADDI;  break;
     case RISCV::PseudoCCSLLI:  NewOpc = RISCV::SLLI;  break;
     case RISCV::PseudoCCSRLI:  NewOpc = RISCV::SRLI;  break;
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp b/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
index 8b2eb3af59c4e..435df1e4b91b6 100644
--- a/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfo.cpp
@@ -1699,6 +1699,9 @@ unsigned getPredicatedOpcode(unsigned Opcode) {
   case RISCV::OR:    return RISCV::PseudoCCOR;    break;
   case RISCV::XOR:   return RISCV::PseudoCCXOR;   break;
   case RISCV::MAX:   return RISCV::PseudoCCMAX;   break;
+  case RISCV::MAXU:  return RISCV::PseudoCCMAXU;  break;
+  case RISCV::MIN:   return RISCV::PseudoCCMIN;   break;
+  case RISCV::MINU:  return RISCV::PseudoCCMINU;  break;
 
   case RISCV::ADDI:  return RISCV::PseudoCCADDI;  break;
   case RISCV::SLLI:  return RISCV::PseudoCCSLLI;  break;
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td b/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
index 5ca145d6c458c..5a67a5aaba293 100644
--- a/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfoSFB.td
@@ -107,6 +107,9 @@ def PseudoCCAND : SFBALU_rr;
 def PseudoCCOR  : SFBALU_rr;
 def PseudoCCXOR : SFBALU_rr;
 def PseudoCCMAX : SFBALU_rr;
+def PseudoCCMIN : SFBALU_rr;
+def PseudoCCMAXU : SFBALU_rr;
+def PseudoCCMINU : SFBALU_rr;
 
 def PseudoCCADDI : SFBALU_ri;
 def PseudoCCANDI : SFBALU_ri;
diff --git a/llvm/test/CodeGen/RISCV/short-forward-branch-opt-min-max.ll b/llvm/test/CodeGen/RISCV/short-forward-branch-opt-min-max.ll
new file mode 100644
index 0000000000000..9fa4e350aced9
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/short-forward-branch-opt-min-max.ll
@@ -0,0 +1,539 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6
+; RUN: llc < %s -mtriple=riscv32 | FileCheck %s --check-prefixes=RV32I-NOZBB
+; RUN: llc < %s -mtriple=riscv64 | FileCheck %s --check-prefixes=RV64I-NOZBB
+; RUN: llc < %s -mtriple=riscv32 -mattr=+zbb,+short-forward-branch-opt | \
+; RUN:   FileCheck %s --check-prefixes=RV32I-SFB-ZBB
+; RUN: llc < %s -mtriple=riscv64 -mattr=+zbb,+short-forward-branch-opt | \
+; RUN:   FileCheck %s --check-prefixes=RV64I-SFB-ZBB
+
+define i32 @select_example_smax(i32 %a, i32 %b, i1 zeroext %x, i32 %y) {
+; RV32I-NOZBB-LABEL: select_example_smax:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    bge a3, a0, .LBB0_3
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    beqz a2, .LBB0_4
+; RV32I-NOZBB-NEXT:  .LBB0_2: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB0_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a3
+; RV32I-NOZBB-NEXT:    bnez a2, .LBB0_2
+; RV32I-NOZBB-NEXT:  .LBB0_4: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a1
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_smax:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    sext.w a0, a0
+; RV64I-NOZBB-NEXT:    sext.w a3, a3
+; RV64I-NOZBB-NEXT:    bge a3, a0, .LBB0_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB0_4
+; RV64I-NOZBB-NEXT:  .LBB0_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB0_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB0_2
+; RV64I-NOZBB-NEXT:  .LBB0_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_smax:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    beqz a2, .LBB0_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    max a1, a0, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB0_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a1
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_smax:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    sext.w a3, a3
+; RV64I-SFB-ZBB-NEXT:    sext.w a0, a0
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB0_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    max a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB0_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i32 @llvm.smax.i32(i32 %a, i32 %y)
+  %sel = select i1 %x, i32 %res, i32 %b
+  ret i32 %sel
+}
+
+define i32 @select_example_smin(i32 %a, i32 %b, i1 zeroext %x, i32 %y) {
+; RV32I-NOZBB-LABEL: select_example_smin:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    bge a0, a3, .LBB1_3
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    beqz a2, .LBB1_4
+; RV32I-NOZBB-NEXT:  .LBB1_2: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB1_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a3
+; RV32I-NOZBB-NEXT:    bnez a2, .LBB1_2
+; RV32I-NOZBB-NEXT:  .LBB1_4: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a1
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_smin:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    sext.w a3, a3
+; RV64I-NOZBB-NEXT:    sext.w a0, a0
+; RV64I-NOZBB-NEXT:    bge a0, a3, .LBB1_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB1_4
+; RV64I-NOZBB-NEXT:  .LBB1_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB1_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB1_2
+; RV64I-NOZBB-NEXT:  .LBB1_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_smin:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    beqz a2, .LBB1_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    min a1, a0, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB1_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a1
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_smin:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    sext.w a3, a3
+; RV64I-SFB-ZBB-NEXT:    sext.w a0, a0
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB1_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    min a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB1_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i32 @llvm.smin.i32(i32 %a, i32 %y)
+  %sel = select i1 %x, i32 %res, i32 %b
+  ret i32 %sel
+}
+
+define i32 @select_example_umax(i32 %a, i32 %b, i1 zeroext %x, i32 %y) {
+; RV32I-NOZBB-LABEL: select_example_umax:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    bgeu a3, a0, .LBB2_3
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    beqz a2, .LBB2_4
+; RV32I-NOZBB-NEXT:  .LBB2_2: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB2_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a3
+; RV32I-NOZBB-NEXT:    bnez a2, .LBB2_2
+; RV32I-NOZBB-NEXT:  .LBB2_4: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a1
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_umax:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    sext.w a0, a0
+; RV64I-NOZBB-NEXT:    sext.w a3, a3
+; RV64I-NOZBB-NEXT:    bgeu a3, a0, .LBB2_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB2_4
+; RV64I-NOZBB-NEXT:  .LBB2_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB2_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB2_2
+; RV64I-NOZBB-NEXT:  .LBB2_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_umax:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    beqz a2, .LBB2_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    maxu a1, a0, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB2_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a1
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_umax:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    sext.w a3, a3
+; RV64I-SFB-ZBB-NEXT:    sext.w a0, a0
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB2_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    maxu a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB2_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i32 @llvm.umax.i32(i32 %a, i32 %y)
+  %sel = select i1 %x, i32 %res, i32 %b
+  ret i32 %sel
+}
+
+define i32 @select_example_umin(i32 %a, i32 %b, i1 zeroext %x, i32 %y) {
+; RV32I-NOZBB-LABEL: select_example_umin:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    bgeu a0, a3, .LBB3_3
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    beqz a2, .LBB3_4
+; RV32I-NOZBB-NEXT:  .LBB3_2: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB3_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a3
+; RV32I-NOZBB-NEXT:    bnez a2, .LBB3_2
+; RV32I-NOZBB-NEXT:  .LBB3_4: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a1
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_umin:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    sext.w a3, a3
+; RV64I-NOZBB-NEXT:    sext.w a0, a0
+; RV64I-NOZBB-NEXT:    bgeu a0, a3, .LBB3_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB3_4
+; RV64I-NOZBB-NEXT:  .LBB3_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB3_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB3_2
+; RV64I-NOZBB-NEXT:  .LBB3_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_umin:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    beqz a2, .LBB3_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    minu a1, a0, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB3_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a1
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_umin:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    sext.w a3, a3
+; RV64I-SFB-ZBB-NEXT:    sext.w a0, a0
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB3_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    minu a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB3_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i32 @llvm.umin.i32(i32 %a, i32 %y)
+  %sel = select i1 %x, i32 %res, i32 %b
+  ret i32 %sel
+}
+
+define i64 @select_example_smax_1(i64 %a, i64 %b, i1 zeroext %x, i64 %y) {
+; RV32I-NOZBB-LABEL: select_example_smax_1:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    beq a1, a6, .LBB4_2
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    slt a7, a6, a1
+; RV32I-NOZBB-NEXT:    beqz a7, .LBB4_3
+; RV32I-NOZBB-NEXT:    j .LBB4_4
+; RV32I-NOZBB-NEXT:  .LBB4_2:
+; RV32I-NOZBB-NEXT:    sltu a7, a5, a0
+; RV32I-NOZBB-NEXT:    bnez a7, .LBB4_4
+; RV32I-NOZBB-NEXT:  .LBB4_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a1, a6
+; RV32I-NOZBB-NEXT:    mv a0, a5
+; RV32I-NOZBB-NEXT:  .LBB4_4: # %entry
+; RV32I-NOZBB-NEXT:    beqz a4, .LBB4_6
+; RV32I-NOZBB-NEXT:  # %bb.5: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB4_6: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a2
+; RV32I-NOZBB-NEXT:    mv a1, a3
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_smax_1:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    bge a3, a0, .LBB4_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB4_4
+; RV64I-NOZBB-NEXT:  .LBB4_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB4_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB4_2
+; RV64I-NOZBB-NEXT:  .LBB4_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_smax_1:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    sltu a7, a5, a0
+; RV32I-SFB-ZBB-NEXT:    slt t0, a6, a1
+; RV32I-SFB-ZBB-NEXT:    bne a1, a6, .LBB4_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv t0, a7
+; RV32I-SFB-ZBB-NEXT:  .LBB4_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB4_4
+; RV32I-SFB-ZBB-NEXT:  # %bb.3: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a6
+; RV32I-SFB-ZBB-NEXT:  .LBB4_4: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB4_6
+; RV32I-SFB-ZBB-NEXT:  # %bb.5: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a5
+; RV32I-SFB-ZBB-NEXT:  .LBB4_6: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB4_8
+; RV32I-SFB-ZBB-NEXT:  # %bb.7: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a2
+; RV32I-SFB-ZBB-NEXT:  .LBB4_8: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB4_10
+; RV32I-SFB-ZBB-NEXT:  # %bb.9: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB4_10: # %entry
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_smax_1:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB4_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    max a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB4_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i64 @llvm.smax.i64(i64 %a, i64 %y)
+  %sel = select i1 %x, i64 %res, i64 %b
+  ret i64 %sel
+}
+
+define i64 @select_example_smin_1(i64 %a, i64 %b, i1 zeroext %x, i64 %y) {
+; RV32I-NOZBB-LABEL: select_example_smin_1:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    beq a1, a6, .LBB5_2
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    slt a7, a1, a6
+; RV32I-NOZBB-NEXT:    beqz a7, .LBB5_3
+; RV32I-NOZBB-NEXT:    j .LBB5_4
+; RV32I-NOZBB-NEXT:  .LBB5_2:
+; RV32I-NOZBB-NEXT:    sltu a7, a0, a5
+; RV32I-NOZBB-NEXT:    bnez a7, .LBB5_4
+; RV32I-NOZBB-NEXT:  .LBB5_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a1, a6
+; RV32I-NOZBB-NEXT:    mv a0, a5
+; RV32I-NOZBB-NEXT:  .LBB5_4: # %entry
+; RV32I-NOZBB-NEXT:    beqz a4, .LBB5_6
+; RV32I-NOZBB-NEXT:  # %bb.5: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB5_6: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a2
+; RV32I-NOZBB-NEXT:    mv a1, a3
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_smin_1:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    bge a0, a3, .LBB5_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB5_4
+; RV64I-NOZBB-NEXT:  .LBB5_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB5_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB5_2
+; RV64I-NOZBB-NEXT:  .LBB5_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_smin_1:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    sltu a7, a0, a5
+; RV32I-SFB-ZBB-NEXT:    slt t0, a1, a6
+; RV32I-SFB-ZBB-NEXT:    bne a1, a6, .LBB5_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv t0, a7
+; RV32I-SFB-ZBB-NEXT:  .LBB5_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB5_4
+; RV32I-SFB-ZBB-NEXT:  # %bb.3: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a6
+; RV32I-SFB-ZBB-NEXT:  .LBB5_4: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB5_6
+; RV32I-SFB-ZBB-NEXT:  # %bb.5: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a5
+; RV32I-SFB-ZBB-NEXT:  .LBB5_6: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB5_8
+; RV32I-SFB-ZBB-NEXT:  # %bb.7: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a2
+; RV32I-SFB-ZBB-NEXT:  .LBB5_8: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB5_10
+; RV32I-SFB-ZBB-NEXT:  # %bb.9: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB5_10: # %entry
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_smin_1:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB5_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    min a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB5_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i64 @llvm.smin.i64(i64 %a, i64 %y)
+  %sel = select i1 %x, i64 %res, i64 %b
+  ret i64 %sel
+}
+
+define i64 @select_example_umax_1(i64 %a, i64 %b, i1 zeroext %x, i64 %y) {
+; RV32I-NOZBB-LABEL: select_example_umax_1:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    beq a1, a6, .LBB6_2
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    sltu a7, a6, a1
+; RV32I-NOZBB-NEXT:    beqz a7, .LBB6_3
+; RV32I-NOZBB-NEXT:    j .LBB6_4
+; RV32I-NOZBB-NEXT:  .LBB6_2:
+; RV32I-NOZBB-NEXT:    sltu a7, a5, a0
+; RV32I-NOZBB-NEXT:    bnez a7, .LBB6_4
+; RV32I-NOZBB-NEXT:  .LBB6_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a1, a6
+; RV32I-NOZBB-NEXT:    mv a0, a5
+; RV32I-NOZBB-NEXT:  .LBB6_4: # %entry
+; RV32I-NOZBB-NEXT:    beqz a4, .LBB6_6
+; RV32I-NOZBB-NEXT:  # %bb.5: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB6_6: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a2
+; RV32I-NOZBB-NEXT:    mv a1, a3
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_umax_1:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    bgeu a3, a0, .LBB6_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB6_4
+; RV64I-NOZBB-NEXT:  .LBB6_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB6_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB6_2
+; RV64I-NOZBB-NEXT:  .LBB6_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_umax_1:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    sltu a7, a5, a0
+; RV32I-SFB-ZBB-NEXT:    sltu t0, a6, a1
+; RV32I-SFB-ZBB-NEXT:    bne a1, a6, .LBB6_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv t0, a7
+; RV32I-SFB-ZBB-NEXT:  .LBB6_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB6_4
+; RV32I-SFB-ZBB-NEXT:  # %bb.3: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a6
+; RV32I-SFB-ZBB-NEXT:  .LBB6_4: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB6_6
+; RV32I-SFB-ZBB-NEXT:  # %bb.5: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a5
+; RV32I-SFB-ZBB-NEXT:  .LBB6_6: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB6_8
+; RV32I-SFB-ZBB-NEXT:  # %bb.7: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a2
+; RV32I-SFB-ZBB-NEXT:  .LBB6_8: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB6_10
+; RV32I-SFB-ZBB-NEXT:  # %bb.9: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB6_10: # %entry
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_umax_1:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB6_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    maxu a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB6_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i64 @llvm.umax.i64(i64 %a, i64 %y)
+  %sel = select i1 %x, i64 %res, i64 %b
+  ret i64 %sel
+}
+
+define i64 @select_example_umin_1(i64 %a, i64 %b, i1 zeroext %x, i64 %y) {
+; RV32I-NOZBB-LABEL: select_example_umin_1:
+; RV32I-NOZBB:       # %bb.0: # %entry
+; RV32I-NOZBB-NEXT:    beq a1, a6, .LBB7_2
+; RV32I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV32I-NOZBB-NEXT:    sltu a7, a1, a6
+; RV32I-NOZBB-NEXT:    beqz a7, .LBB7_3
+; RV32I-NOZBB-NEXT:    j .LBB7_4
+; RV32I-NOZBB-NEXT:  .LBB7_2:
+; RV32I-NOZBB-NEXT:    sltu a7, a0, a5
+; RV32I-NOZBB-NEXT:    bnez a7, .LBB7_4
+; RV32I-NOZBB-NEXT:  .LBB7_3: # %entry
+; RV32I-NOZBB-NEXT:    mv a1, a6
+; RV32I-NOZBB-NEXT:    mv a0, a5
+; RV32I-NOZBB-NEXT:  .LBB7_4: # %entry
+; RV32I-NOZBB-NEXT:    beqz a4, .LBB7_6
+; RV32I-NOZBB-NEXT:  # %bb.5: # %entry
+; RV32I-NOZBB-NEXT:    ret
+; RV32I-NOZBB-NEXT:  .LBB7_6: # %entry
+; RV32I-NOZBB-NEXT:    mv a0, a2
+; RV32I-NOZBB-NEXT:    mv a1, a3
+; RV32I-NOZBB-NEXT:    ret
+;
+; RV64I-NOZBB-LABEL: select_example_umin_1:
+; RV64I-NOZBB:       # %bb.0: # %entry
+; RV64I-NOZBB-NEXT:    bgeu a0, a3, .LBB7_3
+; RV64I-NOZBB-NEXT:  # %bb.1: # %entry
+; RV64I-NOZBB-NEXT:    beqz a2, .LBB7_4
+; RV64I-NOZBB-NEXT:  .LBB7_2: # %entry
+; RV64I-NOZBB-NEXT:    ret
+; RV64I-NOZBB-NEXT:  .LBB7_3: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a3
+; RV64I-NOZBB-NEXT:    bnez a2, .LBB7_2
+; RV64I-NOZBB-NEXT:  .LBB7_4: # %entry
+; RV64I-NOZBB-NEXT:    mv a0, a1
+; RV64I-NOZBB-NEXT:    ret
+;
+; RV32I-SFB-ZBB-LABEL: select_example_umin_1:
+; RV32I-SFB-ZBB:       # %bb.0: # %entry
+; RV32I-SFB-ZBB-NEXT:    sltu a7, a0, a5
+; RV32I-SFB-ZBB-NEXT:    sltu t0, a1, a6
+; RV32I-SFB-ZBB-NEXT:    bne a1, a6, .LBB7_2
+; RV32I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv t0, a7
+; RV32I-SFB-ZBB-NEXT:  .LBB7_2: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB7_4
+; RV32I-SFB-ZBB-NEXT:  # %bb.3: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a6
+; RV32I-SFB-ZBB-NEXT:  .LBB7_4: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez t0, .LBB7_6
+; RV32I-SFB-ZBB-NEXT:  # %bb.5: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a5
+; RV32I-SFB-ZBB-NEXT:  .LBB7_6: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB7_8
+; RV32I-SFB-ZBB-NEXT:  # %bb.7: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a0, a2
+; RV32I-SFB-ZBB-NEXT:  .LBB7_8: # %entry
+; RV32I-SFB-ZBB-NEXT:    bnez a4, .LBB7_10
+; RV32I-SFB-ZBB-NEXT:  # %bb.9: # %entry
+; RV32I-SFB-ZBB-NEXT:    mv a1, a3
+; RV32I-SFB-ZBB-NEXT:  .LBB7_10: # %entry
+; RV32I-SFB-ZBB-NEXT:    ret
+;
+; RV64I-SFB-ZBB-LABEL: select_example_umin_1:
+; RV64I-SFB-ZBB:       # %bb.0: # %entry
+; RV64I-SFB-ZBB-NEXT:    beqz a2, .LBB7_2
+; RV64I-SFB-ZBB-NEXT:  # %bb.1: # %entry
+; RV64I-SFB-ZBB-NEXT:    minu a1, a0, a3
+; RV64I-SFB-ZBB-NEXT:  .LBB7_2: # %entry
+; RV64I-SFB-ZBB-NEXT:    mv a0, a1
+; RV64I-SFB-ZBB-NEXT:    ret
+entry:
+  %res = call i64 @llvm.umin.i64(i64 %a, i64 %y)
+  %sel = select i1 %x, i64 %res, i64 %b
+  ret i64 %sel
+}



More information about the llvm-commits mailing list