[llvm] r328691 - [ARM] Support float literals under XO

Wed Mar 28 03:02:27 PDT 2018

Author: christof
Date: Wed Mar 28 03:02:26 2018
New Revision: 328691

URL: http://llvm.org/viewvc/llvm-project?rev=328691&view=rev
Log:
[ARM] Support float literals under XO

Follow up patch of r328313 to support the UseVMOVSR constraint. Removed
some unneeded instructions from the test and removed some stray
comments.

Differential Revision: https://reviews.llvm.org/D44941

Modified:
    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
    llvm/trunk/lib/Target/ARM/ARMInstrNEON.td
    llvm/trunk/lib/Target/ARM/ARMInstrVFP.td
    llvm/trunk/test/CodeGen/ARM/fcmp-xo.ll

Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=328691&r1=328690&r2=328691&view=diff
==============================================================================

--- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Wed Mar 28 03:02:26 2018
@@ -4519,8 +4519,8 @@ SDValue ARMTargetLowering::LowerSELECT_C
   bool InvalidOnQNaN;
   FPCCToARMCC(CC, CondCode, CondCode2, InvalidOnQNaN);
 
-  // Try to generate VMAXNM/VMINNM on ARMv8. Except if we compare to a zero.
-  // This ensures we use CMPFPw0 instead of CMPFP in such case.
+  // Normalize the fp compare. If RHS is zero we keep it there so we match
+  // CMPFPw0 instead of CMPFP.
   if (Subtarget->hasFPARMv8() && !isFloatingPointZero(RHS) &&
     (TrueVal.getValueType() == MVT::f32 || TrueVal.getValueType() == MVT::f64)) {
     bool swpCmpOps = false;

Modified: llvm/trunk/lib/Target/ARM/ARMInstrNEON.td
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMInstrNEON.td?rev=328691&r1=328690&r2=328691&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMInstrNEON.td (original)
+++ llvm/trunk/lib/Target/ARM/ARMInstrNEON.td Wed Mar 28 03:02:26 2018
@@ -6935,6 +6935,9 @@ def : VFPPat<(f64 (uint_to_fp (extractel
 def : Pat<(f32 (bitconvert GPR:$a)),
           (EXTRACT_SUBREG (VMOVDRR GPR:$a, GPR:$a), ssub_0)>,
         Requires<[HasNEON, DontUseVMOVSR]>;
+def : Pat<(arm_vmovsr GPR:$a),
+          (EXTRACT_SUBREG (VMOVDRR GPR:$a, GPR:$a), ssub_0)>,
+        Requires<[HasNEON, DontUseVMOVSR]>;
 
 //===----------------------------------------------------------------------===//
 // Non-Instruction Patterns

Modified: llvm/trunk/lib/Target/ARM/ARMInstrVFP.td
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMInstrVFP.td?rev=328691&r1=328690&r2=328691&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMInstrVFP.td (original)
+++ llvm/trunk/lib/Target/ARM/ARMInstrVFP.td Wed Mar 28 03:02:26 2018
@@ -1069,7 +1069,7 @@ def VMOVSR : AVConv4I<0b11100000, 0b1010
   // pipelines.
   let D = VFPNeonDomain;
 }
-def : Pat<(arm_vmovsr GPR:$Rt), (VMOVSR GPR:$Rt)>;
+def : Pat<(arm_vmovsr GPR:$Rt), (VMOVSR GPR:$Rt)>, Requires<[HasVFP2, UseVMOVSR]>;
 
 let hasSideEffects = 0 in {
 def VMOVRRD  : AVConv3I<0b11000101, 0b1011,

Modified: llvm/trunk/test/CodeGen/ARM/fcmp-xo.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/fcmp-xo.ll?rev=328691&r1=328690&r2=328691&view=diff
==============================================================================
--- llvm/trunk/test/CodeGen/ARM/fcmp-xo.ll (original)
+++ llvm/trunk/test/CodeGen/ARM/fcmp-xo.ll Wed Mar 28 03:02:26 2018
@@ -1,118 +1,61 @@
-; RUN: llc -mtriple=thumbv7m-arm-none-eabi -mattr=+execute-only,+fp-armv8 %s -o - | FileCheck %s
+; RUN: llc -mtriple=thumbv7m-arm-none-eabi -mattr=+execute-only,+fp-armv8 %s -o - | FileCheck --check-prefixes=CHECK,VMOVSR %s
+; RUN: llc -mtriple=thumbv7m-arm-none-eabi -mattr=+execute-only,+fp-armv8,+neon,+neonfp %s -o - | FileCheck --check-prefixes=CHECK,NEON %s
 
-; This function used to run into a code selection error on fp-armv8 due to
-; different ordering of the constant arguments of fcmp. Fixed by extending the
-; code selection to handle the missing case.
-define arm_aapcs_vfpcc void @foo0() local_unnamed_addr {
-  br i1 undef, label %.end, label %1
-
-  %2 = fcmp nsz olt float undef, 0.000000e+00
-  %3 = select i1 %2, float -5.000000e-01, float 5.000000e-01
-  %4 = fadd nsz float undef, %3
-  %5 = fptosi float %4 to i32
-  %6 = ashr i32 %5, 4
-  %7 = icmp slt i32 %6, 0
-  br i1 %7, label %8, label %.end
-
-  tail call arm_aapcs_vfpcc void @bar()
-  br label %.end
-
-.end:
-  ret void
+define arm_aapcs_vfpcc float @foo0() local_unnamed_addr {
+  %1 = fcmp nsz olt float undef, 0.000000e+00
+  %2 = select i1 %1, float -5.000000e-01, float 5.000000e-01
+  ret float %2
 }
 ; CHECK-LABEL: foo0
 ; CHECK: vcmpe.f32 {{s[0-9]+}}, #0
 
 
-define arm_aapcs_vfpcc void @float1() local_unnamed_addr {
+define arm_aapcs_vfpcc float @float1() local_unnamed_addr {
   br i1 undef, label %.end, label %1
 
   %2 = fcmp nsz olt float undef, 1.000000e+00
   %3 = select i1 %2, float -5.000000e-01, float 5.000000e-01
-  %4 = fadd nsz float undef, %3
-  %5 = fptosi float %4 to i32
-  %6 = ashr i32 %5, 4
-  %7 = icmp slt i32 %6, 0
-  br i1 %7, label %8, label %.end
-
-  tail call arm_aapcs_vfpcc void @bar()
   br label %.end
 
 .end:
-  ret void
+  %4 = phi float [ undef, %0 ], [ %3, %1]
+  ret float %4
 }
 ; CHECK-LABEL: float1
 ; CHECK: vmov.f32 [[FPREG:s[0-9]+]], #1.000000e+00
 ; CHECK: vcmpe.f32 [[FPREG]], {{s[0-9]+}}
 
-define arm_aapcs_vfpcc void @float128() local_unnamed_addr {
-  br i1 undef, label %.end, label %1
-
-  %2 = fcmp nsz olt float undef, 128.000000e+00
-  %3 = select i1 %2, float -5.000000e-01, float 5.000000e-01
-  %4 = fadd nsz float undef, %3
-  %5 = fptosi float %4 to i32
-  %6 = ashr i32 %5, 4
-  %7 = icmp slt i32 %6, 0
-  br i1 %7, label %8, label %.end
-
-  tail call arm_aapcs_vfpcc void @bar()
-  br label %.end
-
-.end:
-  ret void
+define arm_aapcs_vfpcc float @float128() local_unnamed_addr {
+  %1 = fcmp nsz olt float undef, 128.000000e+00
+  %2 = select i1 %1, float -5.000000e-01, float 5.000000e-01
+  ret float %2
 }
 ; CHECK-LABEL: float128
 ; CHECK: mov.w [[REG:r[0-9]+]], #1124073472
-; CHECK: vmov [[FPREG:s[0-9]+]], [[REG]]
-; CHECK: vcmpe.f32 [[FPREG]], {{s[0-9]+}}
+; VMOVSR: vmov [[FPREG:s[0-9]+]], [[REG]]
+; VMOVSR: vcmpe.f32 [[FPREG]], {{s[0-9]+}}
+; NEON: vmov d2, [[REG]], [[REG]]
+; NEON: vcmpe.f32 s4, {{s[0-9]+}}
 
 
-define arm_aapcs_vfpcc void @double1() local_unnamed_addr {
-  br i1 undef, label %.end, label %1
-
-  %2 = fcmp nsz olt double undef, 1.000000e+00
-  %3 = select i1 %2, double -5.000000e-01, double 5.000000e-01
-  %4 = fadd nsz double undef, %3
-  %5 = fptosi double %4 to i32
-  %6 = ashr i32 %5, 4
-  %7 = icmp slt i32 %6, 0
-  br i1 %7, label %8, label %.end
-
-  tail call arm_aapcs_vfpcc void @bar()
-  br label %.end
-
-.end:
-  ret void
+define arm_aapcs_vfpcc double @double1() local_unnamed_addr {
+  %1 = fcmp nsz olt double undef, 1.000000e+00
+  %2 = select i1 %1, double -5.000000e-01, double 5.000000e-01
+  ret double %2
 }
 ; CHECK-LABEL: double1
 ; CHECK: vmov.f64 [[FPREG:d[0-9]+]], #1.000000e+00
 ; CHECK: vcmpe.f64 [[FPREG]], {{d[0-9]+}}
 
-define arm_aapcs_vfpcc void @double128() local_unnamed_addr {
-  br i1 undef, label %.end, label %1
-
-  %2 = fcmp nsz olt double undef, 128.000000e+00
-  %3 = select i1 %2, double -5.000000e-01, double 5.000000e-01
-  %4 = fadd nsz double undef, %3
-  %5 = fptosi double %4 to i32
-  %6 = ashr i32 %5, 4
-  %7 = icmp slt i32 %6, 0
-  br i1 %7, label %8, label %.end
-
-  tail call arm_aapcs_vfpcc void @bar()
-  br label %.end
-
-.end:
-  ret void
+define arm_aapcs_vfpcc double @double128() local_unnamed_addr {
+  %1 = fcmp nsz olt double undef, 128.000000e+00
+  %2 = select i1 %1, double -5.000000e-01, double 5.000000e-01
+  ret double %2
 }
 ; CHECK-LABEL: double128
-; CHECK: movs [[REGL:r[0-9]+]], #0
 ; CHECK: movs [[REGH:r[0-9]+]], #0
 ; CHECK: movt [[REGH]], #16480
+; CHECK: movs [[REGL:r[0-9]+]], #0
 ; CHECK: vmov [[FPREG:d[0-9]+]], [[REGL]], [[REGH]]
 ; CHECK: vcmpe.f64 [[FPREG]], {{d[0-9]+}}
 
-
-declare arm_aapcs_vfpcc void @bar() local_unnamed_addr
-