[llvm] de681d5 - [PowerPC] Do not attempt to combine fptoui without FPCVT

Nemanja Ivanovic via llvm-commits llvm-commits at lists.llvm.org
Wed May 24 09:14:38 PDT 2023


Author: Nemanja Ivanovic
Date: 2023-05-24T11:14:26-05:00
New Revision: de681d53ba8278ebb14b056bd7a2385bbe48ad82

URL: https://github.com/llvm/llvm-project/commit/de681d53ba8278ebb14b056bd7a2385bbe48ad82
DIFF: https://github.com/llvm/llvm-project/commit/de681d53ba8278ebb14b056bd7a2385bbe48ad82.diff

LOG: [PowerPC] Do not attempt to combine fptoui without FPCVT

Commit 8064caf83fb166b709bfe0e7641c5181341cb064 added a call
to a function that performs this combine without checking whether
the target supports FPCVT. This caused asserts to trip on BE bots
as the default target does not have this feature.

Added: 
    llvm/test/CodeGen/PowerPC/fptoui-be-crash.ll

Modified: 
    llvm/lib/Target/PowerPC/PPCISelLowering.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
index 358be0a69a0cc..b51abdb17d31f 100644
--- a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
+++ b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
@@ -15515,8 +15515,10 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
 
     EVT Op1VT = N->getOperand(1).getValueType();
     unsigned Opcode = N->getOperand(1).getOpcode();
+    bool NeedsFPCVT = Opcode == ISD::FP_TO_UINT && Op1VT == MVT::i64;
 
-    if (Opcode == ISD::FP_TO_SINT || Opcode == ISD::FP_TO_UINT) {
+    if ((Opcode == ISD::FP_TO_SINT || Opcode == ISD::FP_TO_UINT) &&
+        (!NeedsFPCVT || Subtarget.hasFPCVT())) {
       SDValue Val= combineStoreFPToInt(N, DCI);
       if (Val)
         return Val;

diff  --git a/llvm/test/CodeGen/PowerPC/fptoui-be-crash.ll b/llvm/test/CodeGen/PowerPC/fptoui-be-crash.ll
new file mode 100644
index 0000000000000..fc93f893b1d5d
--- /dev/null
+++ b/llvm/test/CodeGen/PowerPC/fptoui-be-crash.ll
@@ -0,0 +1,76 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
+; RUN: llc -verify-machineinstrs -ppc-asm-full-reg-names \
+; RUN:   -mtriple=powerpc64-unknown-linux-gnu < %s | FileCheck %s
+define dso_local void @calc_buffer() local_unnamed_addr #0 {
+; CHECK-LABEL: calc_buffer:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    ld r3, 0(r3)
+; CHECK-NEXT:    sradi r5, r3, 53
+; CHECK-NEXT:    rldicl r6, r3, 63, 1
+; CHECK-NEXT:    clrldi r7, r3, 63
+; CHECK-NEXT:    clrldi r4, r3, 53
+; CHECK-NEXT:    addi r5, r5, 1
+; CHECK-NEXT:    or r7, r7, r6
+; CHECK-NEXT:    cmpldi r5, 1
+; CHECK-NEXT:    clrldi r5, r7, 53
+; CHECK-NEXT:    addi r4, r4, 2047
+; CHECK-NEXT:    addi r5, r5, 2047
+; CHECK-NEXT:    or r5, r5, r6
+; CHECK-NEXT:    rldicl r6, r3, 10, 54
+; CHECK-NEXT:    or r4, r4, r3
+; CHECK-NEXT:    addi r6, r6, 1
+; CHECK-NEXT:    rldicl r5, r5, 53, 11
+; CHECK-NEXT:    cmpldi cr1, r6, 1
+; CHECK-NEXT:    rldicr r4, r4, 0, 52
+; CHECK-NEXT:    rldicl r5, r5, 11, 1
+; CHECK-NEXT:    bc 12, gt, .LBB0_2
+; CHECK-NEXT:  # %bb.1:
+; CHECK-NEXT:    ori r4, r3, 0
+; CHECK-NEXT:    b .LBB0_2
+; CHECK-NEXT:  .LBB0_2:
+; CHECK-NEXT:    bc 12, 4*cr1+gt, .LBB0_4
+; CHECK-NEXT:  # %bb.3:
+; CHECK-NEXT:    ori r5, r7, 0
+; CHECK-NEXT:    b .LBB0_4
+; CHECK-NEXT:  .LBB0_4:
+; CHECK-NEXT:    cmpdi r3, 0
+; CHECK-NEXT:    std r4, -32(r1)
+; CHECK-NEXT:    std r5, -24(r1)
+; CHECK-NEXT:    bc 12, lt, .LBB0_6
+; CHECK-NEXT:  # %bb.5:
+; CHECK-NEXT:    lfd f0, -32(r1)
+; CHECK-NEXT:    fcfid f0, f0
+; CHECK-NEXT:    frsp f0, f0
+; CHECK-NEXT:    b .LBB0_7
+; CHECK-NEXT:  .LBB0_6:
+; CHECK-NEXT:    lfd f0, -24(r1)
+; CHECK-NEXT:    fcfid f0, f0
+; CHECK-NEXT:    frsp f0, f0
+; CHECK-NEXT:    fadds f0, f0, f0
+; CHECK-NEXT:  .LBB0_7:
+; CHECK-NEXT:    addis r3, r2, .LCPI0_0 at toc@ha
+; CHECK-NEXT:    li r4, 1
+; CHECK-NEXT:    lfs f1, .LCPI0_0 at toc@l(r3)
+; CHECK-NEXT:    rldic r4, r4, 63, 0
+; CHECK-NEXT:    fsubs f2, f0, f1
+; CHECK-NEXT:    fctidz f2, f2
+; CHECK-NEXT:    stfd f2, -8(r1)
+; CHECK-NEXT:    fctidz f2, f0
+; CHECK-NEXT:    stfd f2, -16(r1)
+; CHECK-NEXT:    ld r3, -8(r1)
+; CHECK-NEXT:    ld r5, -16(r1)
+; CHECK-NEXT:    fcmpu cr0, f0, f1
+; CHECK-NEXT:    xor r3, r3, r4
+; CHECK-NEXT:    bc 12, lt, .LBB0_8
+; CHECK-NEXT:    b .LBB0_9
+; CHECK-NEXT:  .LBB0_8:
+; CHECK-NEXT:    addi r3, r5, 0
+; CHECK-NEXT:  .LBB0_9:
+; CHECK-NEXT:    std r3, 0(r3)
+  %load_initial = load i64, ptr poison, align 8
+  %conv39 = uitofp i64 %load_initial to float
+  %add48 = fadd float 0.000000e+00, %conv39
+  %conv49 = fptoui float %add48 to i64
+  store i64 %conv49, ptr poison, align 8
+  unreachable
+}


        


More information about the llvm-commits mailing list