[Libclc-dev] [PATCH 1/2] amdgcn/fmin: fcanonicalize operands

Tue Mar 6 09:31:02 PST 2018

The v_min instruction needs canonicalized operands.
Passes CTS on Carrizo.
Fixes minmag CTS on Carrizo.

Signed-off-by: Jan Vesely <jan.vesely at rutgers.edu>
---
 amdgcn/lib/SOURCES      |  1 +
 amdgcn/lib/math/fmin.cl | 31 +++++++++++++++++++++++++++++++
 2 files changed, 32 insertions(+)
 create mode 100644 amdgcn/lib/math/fmin.cl

diff --git a/amdgcn/lib/SOURCES b/amdgcn/lib/SOURCES
index 8e14ce2..95cc276 100644
--- a/amdgcn/lib/SOURCES
+++ b/amdgcn/lib/SOURCES
@@ -1,4 +1,5 @@
 cl_khr_int64_extended_atomics/minmax_helpers.ll
+math/fmin.cl
 math/ldexp.cl
 mem_fence/fence.cl
 synchronization/barrier.cl
diff --git a/amdgcn/lib/math/fmin.cl b/amdgcn/lib/math/fmin.cl
new file mode 100644
index 0000000..6a11785
--- /dev/null
+++ b/amdgcn/lib/math/fmin.cl
@@ -0,0 +1,31 @@
+#include <clc/clc.h>
+
+#include "../../../generic/lib/clcmacro.h"
+
+_CLC_DEF _CLC_OVERLOAD float fmin(float x, float y)
+{
+   /* Canonicalize first: this removes sNaNs and flushes denormals when
+    * they are not enabled. Otherwise the fmin instruction flushes values
+    * only for the comparison but outputs the original denormal. */
+   const float cx = __builtin_canonicalizef(x);
+   const float cy = __builtin_canonicalizef(y);
+   return __builtin_fminf(cx, cy);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmin, float, float)
+
+#ifdef cl_khr_fp64
+
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+
+_CLC_DEF _CLC_OVERLOAD double fmin(double x, double y)
+{
+   /* Canonicalize both operands before taking the minimum. */
+   return __builtin_fmin(__builtin_canonicalize(x),
+                         __builtin_canonicalize(y));
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmin, double, double)
+
+#endif
+
+#define __CLC_BODY <../../../generic/lib/math/fmin.inc>
+#include <clc/math/gentype.inc>
-- 
2.14.3