r232968 - [CodeGen] Convert double -> __fp16 in one step.
Ahmed Bougacha
ahmed.bougacha at gmail.com
Mon Mar 23 10:48:07 PDT 2015
Author: ab
Date: Mon Mar 23 12:48:07 2015
New Revision: 232968
URL: http://llvm.org/viewvc/llvm-project?rev=232968&view=rev
Log:
[CodeGen] Convert double -> __fp16 in one step.
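Fix CodeGen so that, for floating-point types wider than float, we
convert to fp16 in a single step instead of going through the sequence
"InTy -> float -> fp16". This avoids double rounding, which can yield a
result different from the one a single correctly rounded IEEE-754
conversion would produce. Conversions from fp16 to a floating-point
type likewise now use the intrinsic directly on the destination type.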
rdar://17594379, rdar://17468714
Differential Revision: http://reviews.llvm.org/D4602
Part of: http://reviews.llvm.org/D8367
Modified:
cfe/trunk/lib/CodeGen/CGExprScalar.cpp
cfe/trunk/test/CodeGen/fp16-ops.c
Modified: cfe/trunk/lib/CodeGen/CGExprScalar.cpp
URL: http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/CodeGen/CGExprScalar.cpp?rev=232968&r1=232967&r2=232968&view=diff
==============================================================================
--- cfe/trunk/lib/CodeGen/CGExprScalar.cpp (original)
+++ cfe/trunk/lib/CodeGen/CGExprScalar.cpp Mon Mar 23 12:48:07 2015
@@ -745,9 +745,20 @@ Value *ScalarExprEmitter::EmitScalarConv
QualType OrigSrcType = SrcType;
llvm::Type *SrcTy = Src->getType();
- // If casting to/from storage-only half FP, use special intrinsics.
+ // Handle conversions to bool first, they are special: comparisons against 0.
+ if (DstType->isBooleanType())
+ return EmitConversionToBool(Src, SrcType);
+
+ llvm::Type *DstTy = ConvertType(DstType);
+
+ // Cast from storage-only half FP using the special intrinsic.
if (SrcType->isHalfType() && !CGF.getContext().getLangOpts().NativeHalfType &&
!CGF.getContext().getLangOpts().HalfArgsAndReturns) {
+ if (DstTy->isFloatingPointTy())
+ return Builder.CreateCall(
+ CGF.CGM.getIntrinsic(llvm::Intrinsic::convert_from_fp16, DstTy), Src);
+
+ // If this isn't an FP->FP conversion, go through float.
Src = Builder.CreateCall(
CGF.CGM.getIntrinsic(llvm::Intrinsic::convert_from_fp16,
CGF.CGM.FloatTy),
@@ -756,12 +767,6 @@ Value *ScalarExprEmitter::EmitScalarConv
SrcTy = CGF.FloatTy;
}
- // Handle conversions to bool first, they are special: comparisons against 0.
- if (DstType->isBooleanType())
- return EmitConversionToBool(Src, SrcType);
-
- llvm::Type *DstTy = ConvertType(DstType);
-
// Ignore conversions like int -> uint.
if (SrcTy == DstTy)
return Src;
@@ -818,10 +823,14 @@ Value *ScalarExprEmitter::EmitScalarConv
EmitFloatConversionCheck(OrigSrc, OrigSrcType, Src, SrcType, DstType,
DstTy);
- // Cast to half via float
+ // Cast to half using the intrinsic if from FP type, through float otherwise.
if (DstType->isHalfType() && !CGF.getContext().getLangOpts().NativeHalfType &&
- !CGF.getContext().getLangOpts().HalfArgsAndReturns)
+ !CGF.getContext().getLangOpts().HalfArgsAndReturns) {
+ if (SrcTy->isFloatingPointTy())
+ return Builder.CreateCall(
+ CGF.CGM.getIntrinsic(llvm::Intrinsic::convert_to_fp16, SrcTy), Src);
DstTy = CGF.FloatTy;
+ }
if (isa<llvm::IntegerType>(SrcTy)) {
bool InputSigned = SrcType->isSignedIntegerOrEnumerationType();
Modified: cfe/trunk/test/CodeGen/fp16-ops.c
URL: http://llvm.org/viewvc/llvm-project/cfe/trunk/test/CodeGen/fp16-ops.c?rev=232968&r1=232967&r2=232968&view=diff
==============================================================================
--- cfe/trunk/test/CodeGen/fp16-ops.c (original)
+++ cfe/trunk/test/CodeGen/fp16-ops.c Mon Mar 23 12:48:07 2015
@@ -5,6 +5,7 @@ typedef unsigned cond_t;
volatile cond_t test;
volatile __fp16 h0 = 0.0, h1 = 1.0, h2;
volatile float f0, f1, f2;
+volatile double d0;
void foo(void) {
// CHECK-LABEL: define void @foo()
@@ -52,7 +53,7 @@ void foo(void) {
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fmul float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
- h1 = h0 * (__fp16) -2.0;
+ h1 = h0 * (__fp16) -2.0f;
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fmul float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
@@ -71,7 +72,7 @@ void foo(void) {
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fdiv float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
- h1 = (h0 / (__fp16) -2.0);
+ h1 = (h0 / (__fp16) -2.0f);
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fdiv float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
@@ -109,7 +110,7 @@ void foo(void) {
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fsub float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
- h1 = ((__fp16)-2.0 - h0);
+ h1 = ((__fp16)-2.0f - h0);
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fsub float
// CHECK: call i16 @llvm.convert.to.fp16.f32(
@@ -218,7 +219,7 @@ void foo(void) {
// Check assignments (inc. compound)
h0 = h1;
// CHECK: call i16 @llvm.convert.to.fp16.f32(
- h0 = (__fp16)-2.0;
+ h0 = (__fp16)-2.0f;
// CHECK: call i16 @llvm.convert.to.fp16.f32(
h0 = f0;
@@ -231,7 +232,7 @@ void foo(void) {
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fadd
// CHECK: call i16 @llvm.convert.to.fp16.f32(
- h0 += (__fp16)1.0;
+ h0 += (__fp16)1.0f;
// CHECK: call float @llvm.convert.from.fp16.f32(
// CHECK: fadd
// CHECK: call i16 @llvm.convert.to.fp16.f32(
@@ -281,4 +282,19 @@ void foo(void) {
// CHECK: fdiv
// CHECK: call i16 @llvm.convert.to.fp16.f32(
h0 /= f2;
+
+ // Check conversions to/from double
+ // CHECK: call i16 @llvm.convert.to.fp16.f64(
+ h0 = d0;
+
+ // CHECK: [[MID:%.*]] = fptrunc double {{%.*}} to float
+ // CHECK: call i16 @llvm.convert.to.fp16.f32(float [[MID]])
+ h0 = (float)d0;
+
+ // CHECK: call double @llvm.convert.from.fp16.f64(
+ d0 = h0;
+
+ // CHECK: [[MID:%.*]] = call float @llvm.convert.from.fp16.f32(
+ // CHECK: fpext float [[MID]] to double
+ d0 = (float)h0;
}
More information about the cfe-commits mailing list