amdgcn/fmax: fcanonicalize operands. The v_max instruction needs canonicalized operands. Passes CTS on carrizo. Reviewer: Aaron Watry <awatry@gmail.com>. Signed-off-by: Jan Vesely <jan.vesely@rutgers.edu>. git-svn-id: https://llvm.org/svn/llvm-project/libclc/trunk@327076 91177308-0d34-0410-b5e6-96231b3b80d8

commit: a8b683ef7dd2fe729ef18167283502c29e6d9090 [log] [tgz]
author: Jan Vesely <jan.vesely@rutgers.edu> Thu Mar 08 23:01:01 2018 +0000
committer: Jan Vesely <jan.vesely@rutgers.edu> Thu Mar 08 23:01:01 2018 +0000
tree: f797ca8e1491ec4fe827cd8c766bcfaaf17779e5
parent: 443a7c38139df81d858e00a3e4864f9a43e03aff [diff]
diff --git a/amdgcn/lib/SOURCES b/amdgcn/lib/SOURCES
index 9cdc7b8..44c088c 100644
--- a/amdgcn/lib/SOURCES
+++ b/amdgcn/lib/SOURCES

@@ -1,5 +1,6 @@
 cl_khr_int64_extended_atomics/minmax_helpers.ll
 integer/popcount.cl
+math/fmax.cl
 math/fmin.cl
 math/ldexp.cl
 mem_fence/fence.cl

diff --git a/amdgcn/lib/math/fmax.cl b/amdgcn/lib/math/fmax.cl
new file mode 100644
index 0000000..c1e6cb9
--- /dev/null
+++ b/amdgcn/lib/math/fmax.cl

@@ -0,0 +1,31 @@
+#include <clc/clc.h>
+
+#include "../../../generic/lib/clcmacro.h"
+
+_CLC_DEF _CLC_OVERLOAD float fmax(float x, float y)
+{
+   /* Canonicalize both operands first: fcanonicalize removes sNaNs and flushes
+    * denormals if they are not enabled. Without it, the fmax instruction flushes
+    * the values for the comparison only, but outputs the original denormal. */
+   x = __builtin_canonicalizef(x);
+   y = __builtin_canonicalizef(y);
+   return __builtin_fmaxf(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, fmax, float, float)
+
+#ifdef cl_khr_fp64
+
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+
+_CLC_DEF _CLC_OVERLOAD double fmax(double x, double y)
+{
+   /* Double-precision overload: canonicalize both operands before taking the
+    * maximum, for the same reason as in the float overload. */
+   x = __builtin_canonicalize(x);
+   y = __builtin_canonicalize(y);
+   return __builtin_fmax(x, y);
+}
+_CLC_BINARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, fmax, double, double)
+
+#endif
+
+#define __CLC_BODY <../../../generic/lib/math/fmax.inc>
+#include <clc/math/gentype.inc>
commit	a8b683ef7dd2fe729ef18167283502c29e6d9090	[log] [tgz]
author	Jan Vesely <jan.vesely@rutgers.edu>	Thu Mar 08 23:01:01 2018 +0000
committer	Jan Vesely <jan.vesely@rutgers.edu>	Thu Mar 08 23:01:01 2018 +0000
tree	f797ca8e1491ec4fe827cd8c766bcfaaf17779e5
parent	443a7c38139df81d858e00a3e4864f9a43e03aff [diff]