[libclc] r327076 - amdgcn/fmax: fcanonicalize operands
Jan Vesely via cfe-commits
cfe-commits at lists.llvm.org
Thu Mar 8 15:01:01 PST 2018
Author: jvesely
Date: Thu Mar 8 15:01:01 2018
New Revision: 327076
URL: http://llvm.org/viewvc/llvm-project?rev=327076&view=rev
Log:
amdgcn/fmax: fcanonicalize operands
v_max instruction needs canonicalized operands.
Passes CTS on carrizo
Reviewer: Aaron Watry <awatry at gmail.com>
Signed-off-by: Jan Vesely <jan.vesely at rutgers.edu>
Added:
libclc/trunk/amdgcn/lib/math/fmax.cl
Modified:
libclc/trunk/amdgcn/lib/SOURCES
Modified: libclc/trunk/amdgcn/lib/SOURCES
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/amdgcn/lib/SOURCES?rev=327076&r1=327075&r2=327076&view=diff
==============================================================================
--- libclc/trunk/amdgcn/lib/SOURCES (original)
+++ libclc/trunk/amdgcn/lib/SOURCES Thu Mar 8 15:01:01 2018
@@ -1,5 +1,6 @@
cl_khr_int64_extended_atomics/minmax_helpers.ll
integer/popcount.cl
+math/fmax.cl
math/fmin.cl
math/ldexp.cl
mem_fence/fence.cl
Added: libclc/trunk/amdgcn/lib/math/fmax.cl
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/amdgcn/lib/math/fmax.cl?rev=327076&view=auto
==============================================================================
--- libclc/trunk/amdgcn/lib/math/fmax.cl (added)
+++ libclc/trunk/amdgcn/lib/math/fmax.cl Thu Mar 8 15:01:01 2018
@@ -0,0 +1,31 @@
+#include <clc/clc.h>
+
+#include "../../../generic/lib/clcmacro.h"
+
+_CLC_DEF _CLC_OVERLOAD float fmax(float x, float y)
+{
+ /* fcanonicalize removes sNaNs and flushes denormals if not enabled.
+ * Otherwise fmax instruction flushes the values for comparison,
+ * but outputs original denormal */
+ x = __builtin_canonicalizef(x);
+ y = __builtin_canonicalizef(y);
+ return __builtin_fmaxf(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmax, float, float)
+
+#ifdef cl_khr_fp64
+
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+
+_CLC_DEF _CLC_OVERLOAD double fmax(double x, double y)
+{
+ x = __builtin_canonicalize(x);
+ y = __builtin_canonicalize(y);
+ return __builtin_fmax(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmax, double, double)
+
+#endif
+
+#define __CLC_BODY <../../../generic/lib/math/fmax.inc>
+#include <clc/math/gentype.inc>
More information about the cfe-commits
mailing list