[llvm] r176410 - ARM NEON: Fix v2f32 float intrinsics

Arnold Schwaighofer aschwaighofer at apple.com
Sat Mar 2 11:43:03 PST 2013


Umpf, I forgot to include the bug ID in the commit message. Sorry.

Fixes bug 15416.
radar://13330825



On Mar 2, 2013, at 1:38 PM, Arnold Schwaighofer <aschwaighofer at apple.com> wrote:

> Author: arnolds
> Date: Sat Mar  2 13:38:33 2013
> New Revision: 176410
> 
> URL: http://llvm.org/viewvc/llvm-project?rev=176410&view=rev
> Log:
> ARM NEON: Fix v2f32 float intrinsics
> 
> Mark them as Expand; they are not legal because our backend does not match them.
> 
> Added:
>    llvm/trunk/test/CodeGen/ARM/vfloatintrinsics.ll
> Modified:
>    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
> 
> Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=176410&r1=176409&r2=176410&view=diff
> ==============================================================================
> --- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
> +++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Sat Mar  2 13:38:33 2013
> @@ -504,6 +504,7 @@ ARMTargetLowering::ARMTargetLowering(Tar
>     setOperationAction(ISD::FRINT, MVT::v2f64, Expand);
>     setOperationAction(ISD::FNEARBYINT, MVT::v2f64, Expand);
>     setOperationAction(ISD::FFLOOR, MVT::v2f64, Expand);
> +    setOperationAction(ISD::FMA, MVT::v2f64, Expand);
> 
>     setOperationAction(ISD::FSQRT, MVT::v4f32, Expand);
>     setOperationAction(ISD::FSIN, MVT::v4f32, Expand);
> @@ -521,6 +522,23 @@ ARMTargetLowering::ARMTargetLowering(Tar
>     setOperationAction(ISD::FNEARBYINT, MVT::v4f32, Expand);
>     setOperationAction(ISD::FFLOOR, MVT::v4f32, Expand);
> 
> +    // Mark v2f32 intrinsics.
> +    setOperationAction(ISD::FSQRT, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FSIN, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FCOS, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FPOWI, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FPOW, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FLOG, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FLOG2, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FLOG10, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FEXP, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FEXP2, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FCEIL, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FTRUNC, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FRINT, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FNEARBYINT, MVT::v2f32, Expand);
> +    setOperationAction(ISD::FFLOOR, MVT::v2f32, Expand);
> +
>     // Neon does not support some operations on v1i64 and v2i64 types.
>     setOperationAction(ISD::MUL, MVT::v1i64, Expand);
>     // Custom handling for some quad-vector types to detect VMULL.
> 
> Added: llvm/trunk/test/CodeGen/ARM/vfloatintrinsics.ll
> URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/vfloatintrinsics.ll?rev=176410&view=auto
> ==============================================================================
> --- llvm/trunk/test/CodeGen/ARM/vfloatintrinsics.ll (added)
> +++ llvm/trunk/test/CodeGen/ARM/vfloatintrinsics.ll Sat Mar  2 13:38:33 2013
> @@ -0,0 +1,377 @@
> +; RUN: llc -mcpu=swift -march=arm < %s | FileCheck %s
> +target datalayout = "e-p:32:32:32-i1:8:32-i8:8:32-i16:16:32-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:32:64-v128:32:128-a0:0:32-n32-S32"
> +target triple = "thumbv7-apple-ios6.1.0"
> +
> +;;; Float vectors
> +
> +%v2f32 = type <2 x float>
> +; CHECK: test_v2f32.sqrt:
> +define %v2f32 @test_v2f32.sqrt(%v2f32 %a) {
> +  ; CHECK: sqrt
> +  %1 = call %v2f32 @llvm.sqrt.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.powi:
> +define %v2f32 @test_v2f32.powi(%v2f32 %a, i32 %b) {
> +  ; CHECK: pow
> +  %1 = call %v2f32 @llvm.powi.v2f32(%v2f32 %a, i32 %b)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.sin:
> +define %v2f32 @test_v2f32.sin(%v2f32 %a) {
> +  ; CHECK: sin
> +  %1 = call %v2f32 @llvm.sin.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.cos:
> +define %v2f32 @test_v2f32.cos(%v2f32 %a) {
> +  ; CHECK: cos
> +  %1 = call %v2f32 @llvm.cos.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.pow:
> +define %v2f32 @test_v2f32.pow(%v2f32 %a, %v2f32 %b) {
> +  ; CHECK: pow
> +  %1 = call %v2f32 @llvm.pow.v2f32(%v2f32 %a, %v2f32 %b)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.exp:
> +define %v2f32 @test_v2f32.exp(%v2f32 %a) {
> +  ; CHECK: exp
> +  %1 = call %v2f32 @llvm.exp.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.exp2:
> +define %v2f32 @test_v2f32.exp2(%v2f32 %a) {
> +  ; CHECK: exp
> +  %1 = call %v2f32 @llvm.exp2.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.log:
> +define %v2f32 @test_v2f32.log(%v2f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f32 @llvm.log.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.log10:
> +define %v2f32 @test_v2f32.log10(%v2f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f32 @llvm.log10.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.log2:
> +define %v2f32 @test_v2f32.log2(%v2f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f32 @llvm.log2.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.fma:
> +define %v2f32 @test_v2f32.fma(%v2f32 %a, %v2f32 %b, %v2f32 %c) {
> +  ; CHECK: fma
> +  %1 = call %v2f32 @llvm.fma.v2f32(%v2f32 %a, %v2f32 %b, %v2f32 %c)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.fabs:
> +define %v2f32 @test_v2f32.fabs(%v2f32 %a) {
> +  ; CHECK: fabs
> +  %1 = call %v2f32 @llvm.fabs.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.floor:
> +define %v2f32 @test_v2f32.floor(%v2f32 %a) {
> +  ; CHECK: floor
> +  %1 = call %v2f32 @llvm.floor.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.fceil:
> +define %v2f32 @test_v2f32.fceil(%v2f32 %a) {
> +  ; CHECK: ceil
> +  %1 = call %v2f32 @llvm.fceil.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.trunc:
> +define %v2f32 @test_v2f32.trunc(%v2f32 %a) {
> +  ; CHECK: trunc
> +  %1 = call %v2f32 @llvm.trunc.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.rint:
> +define %v2f32 @test_v2f32.rint(%v2f32 %a) {
> +  ; CHECK: rint
> +  %1 = call %v2f32 @llvm.rint.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +; CHECK: test_v2f32.nearbyint:
> +define %v2f32 @test_v2f32.nearbyint(%v2f32 %a) {
> +  ; CHECK: nearbyint
> +  %1 = call %v2f32 @llvm.nearbyint.v2f32(%v2f32 %a)
> +  ret %v2f32 %1
> +}
> +
> +declare %v2f32 @llvm.sqrt.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.powi.v2f32(%v2f32, i32) #0
> +declare %v2f32 @llvm.sin.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.cos.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.pow.v2f32(%v2f32, %v2f32) #0
> +declare %v2f32 @llvm.exp.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.exp2.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.log.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.log10.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.log2.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.fma.v2f32(%v2f32, %v2f32, %v2f32) #0
> +declare %v2f32 @llvm.fabs.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.floor.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.fceil.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.trunc.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.rint.v2f32(%v2f32) #0
> +declare %v2f32 @llvm.nearbyint.v2f32(%v2f32) #0
> +
> +;;;
> +
> +%v4f32 = type <4 x float>
> +; CHECK: test_v4f32.sqrt:
> +define %v4f32 @test_v4f32.sqrt(%v4f32 %a) {
> +  ; CHECK: sqrt
> +  %1 = call %v4f32 @llvm.sqrt.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.powi:
> +define %v4f32 @test_v4f32.powi(%v4f32 %a, i32 %b) {
> +  ; CHECK: pow
> +  %1 = call %v4f32 @llvm.powi.v4f32(%v4f32 %a, i32 %b)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.sin:
> +define %v4f32 @test_v4f32.sin(%v4f32 %a) {
> +  ; CHECK: sin
> +  %1 = call %v4f32 @llvm.sin.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.cos:
> +define %v4f32 @test_v4f32.cos(%v4f32 %a) {
> +  ; CHECK: cos
> +  %1 = call %v4f32 @llvm.cos.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.pow:
> +define %v4f32 @test_v4f32.pow(%v4f32 %a, %v4f32 %b) {
> +  ; CHECK: pow
> +  %1 = call %v4f32 @llvm.pow.v4f32(%v4f32 %a, %v4f32 %b)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.exp:
> +define %v4f32 @test_v4f32.exp(%v4f32 %a) {
> +  ; CHECK: exp
> +  %1 = call %v4f32 @llvm.exp.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.exp2:
> +define %v4f32 @test_v4f32.exp2(%v4f32 %a) {
> +  ; CHECK: exp
> +  %1 = call %v4f32 @llvm.exp2.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.log:
> +define %v4f32 @test_v4f32.log(%v4f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v4f32 @llvm.log.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.log10:
> +define %v4f32 @test_v4f32.log10(%v4f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v4f32 @llvm.log10.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.log2:
> +define %v4f32 @test_v4f32.log2(%v4f32 %a) {
> +  ; CHECK: log
> +  %1 = call %v4f32 @llvm.log2.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.fma:
> +define %v4f32 @test_v4f32.fma(%v4f32 %a, %v4f32 %b, %v4f32 %c) {
> +  ; CHECK: fma
> +  %1 = call %v4f32 @llvm.fma.v4f32(%v4f32 %a, %v4f32 %b, %v4f32 %c)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.fabs:
> +define %v4f32 @test_v4f32.fabs(%v4f32 %a) {
> +  ; CHECK: fabs
> +  %1 = call %v4f32 @llvm.fabs.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.floor:
> +define %v4f32 @test_v4f32.floor(%v4f32 %a) {
> +  ; CHECK: floor
> +  %1 = call %v4f32 @llvm.floor.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.fceil:
> +define %v4f32 @test_v4f32.fceil(%v4f32 %a) {
> +  ; CHECK: ceil
> +  %1 = call %v4f32 @llvm.fceil.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.trunc:
> +define %v4f32 @test_v4f32.trunc(%v4f32 %a) {
> +  ; CHECK: trunc
> +  %1 = call %v4f32 @llvm.trunc.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.rint:
> +define %v4f32 @test_v4f32.rint(%v4f32 %a) {
> +  ; CHECK: rint
> +  %1 = call %v4f32 @llvm.rint.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +; CHECK: test_v4f32.nearbyint:
> +define %v4f32 @test_v4f32.nearbyint(%v4f32 %a) {
> +  ; CHECK: nearbyint
> +  %1 = call %v4f32 @llvm.nearbyint.v4f32(%v4f32 %a)
> +  ret %v4f32 %1
> +}
> +
> +declare %v4f32 @llvm.sqrt.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.powi.v4f32(%v4f32, i32) #0
> +declare %v4f32 @llvm.sin.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.cos.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.pow.v4f32(%v4f32, %v4f32) #0
> +declare %v4f32 @llvm.exp.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.exp2.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.log.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.log10.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.log2.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.fma.v4f32(%v4f32, %v4f32, %v4f32) #0
> +declare %v4f32 @llvm.fabs.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.floor.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.fceil.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.trunc.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.rint.v4f32(%v4f32) #0
> +declare %v4f32 @llvm.nearbyint.v4f32(%v4f32) #0
> +
> +;;; Double vector
> +
> +%v2f64 = type <2 x double>
> +; CHECK: test_v2f64.sqrt:
> +define %v2f64 @test_v2f64.sqrt(%v2f64 %a) {
> +  ; CHECK: sqrt
> +  %1 = call %v2f64 @llvm.sqrt.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.powi:
> +define %v2f64 @test_v2f64.powi(%v2f64 %a, i32 %b) {
> +  ; CHECK: pow
> +  %1 = call %v2f64 @llvm.powi.v2f64(%v2f64 %a, i32 %b)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.sin:
> +define %v2f64 @test_v2f64.sin(%v2f64 %a) {
> +  ; CHECK: sin
> +  %1 = call %v2f64 @llvm.sin.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.cos:
> +define %v2f64 @test_v2f64.cos(%v2f64 %a) {
> +  ; CHECK: cos
> +  %1 = call %v2f64 @llvm.cos.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.pow:
> +define %v2f64 @test_v2f64.pow(%v2f64 %a, %v2f64 %b) {
> +  ; CHECK: pow
> +  %1 = call %v2f64 @llvm.pow.v2f64(%v2f64 %a, %v2f64 %b)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.exp:
> +define %v2f64 @test_v2f64.exp(%v2f64 %a) {
> +  ; CHECK: exp
> +  %1 = call %v2f64 @llvm.exp.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.exp2:
> +define %v2f64 @test_v2f64.exp2(%v2f64 %a) {
> +  ; CHECK: exp
> +  %1 = call %v2f64 @llvm.exp2.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.log:
> +define %v2f64 @test_v2f64.log(%v2f64 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f64 @llvm.log.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.log10:
> +define %v2f64 @test_v2f64.log10(%v2f64 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f64 @llvm.log10.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.log2:
> +define %v2f64 @test_v2f64.log2(%v2f64 %a) {
> +  ; CHECK: log
> +  %1 = call %v2f64 @llvm.log2.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.fma:
> +define %v2f64 @test_v2f64.fma(%v2f64 %a, %v2f64 %b, %v2f64 %c) {
> +  ; CHECK: fma
> +  %1 = call %v2f64 @llvm.fma.v2f64(%v2f64 %a, %v2f64 %b, %v2f64 %c)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.fabs:
> +define %v2f64 @test_v2f64.fabs(%v2f64 %a) {
> +  ; CHECK: fabs
> +  %1 = call %v2f64 @llvm.fabs.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.floor:
> +define %v2f64 @test_v2f64.floor(%v2f64 %a) {
> +  ; CHECK: floor
> +  %1 = call %v2f64 @llvm.floor.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.fceil:
> +define %v2f64 @test_v2f64.fceil(%v2f64 %a) {
> +  ; CHECK: ceil
> +  %1 = call %v2f64 @llvm.fceil.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.trunc:
> +define %v2f64 @test_v2f64.trunc(%v2f64 %a) {
> +  ; CHECK: trunc
> +  %1 = call %v2f64 @llvm.trunc.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.rint:
> +define %v2f64 @test_v2f64.rint(%v2f64 %a) {
> +  ; CHECK: rint
> +  %1 = call %v2f64 @llvm.rint.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +; CHECK: test_v2f64.nearbyint:
> +define %v2f64 @test_v2f64.nearbyint(%v2f64 %a) {
> +  ; CHECK: nearbyint
> +  %1 = call %v2f64 @llvm.nearbyint.v2f64(%v2f64 %a)
> +  ret %v2f64 %1
> +}
> +
> +declare %v2f64 @llvm.sqrt.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.powi.v2f64(%v2f64, i32) #0
> +declare %v2f64 @llvm.sin.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.cos.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.pow.v2f64(%v2f64, %v2f64) #0
> +declare %v2f64 @llvm.exp.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.exp2.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.log.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.log10.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.log2.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.fma.v2f64(%v2f64, %v2f64, %v2f64) #0
> +declare %v2f64 @llvm.fabs.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.floor.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.fceil.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.trunc.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.rint.v2f64(%v2f64) #0
> +declare %v2f64 @llvm.nearbyint.v2f64(%v2f64) #0
> +
> +attributes #0 = { nounwind readonly }
> 
> 
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at cs.uiuc.edu
> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits




More information about the llvm-commits mailing list