[ESIMD] Fix the unary math operations accepting saturation tag; fix ext_math.cpp test

v-klochkov · v-klochkov · commit 37ddd6c14752 · 2023-08-16T13:36:18.000-07:00
The test ext_math.cpp needed the fix for half type to avoid having NaNs in
inputs.

Signed-off-by: Vyacheslav N Klochkov &lt;vyacheslav.n.klochkov@intel.com&gt;
diff --git a/sycl/include/sycl/ext/intel/esimd/math.hpp b/sycl/include/sycl/ext/intel/esimd/math.hpp
@@ -46,7 +46,7 @@ namespace ext::intel::esimd {
 /// The following conversions are supported:
 /// - \c T0 and \c T1 is the same floating-point type (including \c half). In
 ///   this case the result in the \c i'th lane is:
-///     * \c -1 if \c src[i] is less than \c -1
+///     * \c 0 if \c src[i] is less than \c 0
 ///     * \c 1 if  \c src[i] is greater than \c 1
 ///     * src[i] otherwise
 ///
@@ -352,7 +352,7 @@ ESIMD_NODEBUG
     if constexpr (std::is_same_v<Sat, saturation_off_tag>)                     \
       return res;                                                              \
     else                                                                       \
-      return esimd::saturate<T>(res);                                          \
+      return esimd::saturate<T>(simd<T, N>(res));                              \
   }                                                                            \
                                                                                \
   /** Scalar version.                                                       */ \
diff --git a/sycl/test-e2e/ESIMD/ext_math.cpp b/sycl/test-e2e/ESIMD/ext_math.cpp
@@ -29,6 +29,18 @@
 using namespace sycl;
 using namespace sycl::ext::intel;
 
+#ifdef SATURATION_ON
+#define ESIMD_SATURATION_TAG                                                   \
+  esimd::saturation_on_tag {}
+#define ESIMD_SATURATE(T, x) esimd::saturate<T>(x)
+#define HOST_SATURATE(x) std::max(0.0f, std::min((x), 1.0f))
+#else
+#define ESIMD_SATURATION_TAG                                                   \
+  esimd::saturation_off_tag {}
+#define ESIMD_SATURATE(T, x) (x)
+#define HOST_SATURATE(x) (x)
+#endif
+
 // --- Data initialization functions
 
 // Initialization data for trigonometric functions' input.
@@ -105,22 +117,17 @@ enum class MathOp {
 
 // --- Template functions calculating given math operation on host and device
 
-enum ArgKind {
-  AllVec,
-  AllSca,
-  Sca1Vec2,
-  Sca2Vec1
-};
+enum ArgKind { AllVec, AllSca, Sca1Vec2, Sca2Vec1 };
 
-template <class T, int N, MathOp Op, int Args=AllVec> struct ESIMDf;
-template <class T, int N, MathOp Op, int Args=AllVec> struct BinESIMDf;
-template <class T, int N, MathOp Op, int Args=AllVec> struct SYCLf;
+template <class T, int N, MathOp Op, int Args = AllVec> struct ESIMDf;
+template <class T, int N, MathOp Op, int Args = AllVec> struct BinESIMDf;
+template <class T, int N, MathOp Op, int Args = AllVec> struct SYCLf;
 
 template <class T, MathOp Op> struct HostFunc;
 
 #define DEFINE_HOST_OP(Op, HostOp)                                             \
   template <class T> struct HostFunc<T, MathOp::Op> {                          \
-    T operator()(T X) { return HostOp; }                                       \
+    T operator()(T X) { return HOST_SATURATE(HostOp); }                        \
   };
 
 DEFINE_HOST_OP(sin, std::sin(X));
@@ -139,7 +146,7 @@ DEFINE_HOST_OP(log2, std::log2(X));
 
 #define DEFINE_HOST_BIN_OP(Op, HostOp)                                         \
   template <class T> struct HostFunc<T, MathOp::Op> {                          \
-    T operator()(T X, T Y) { return HostOp; }                                  \
+    T operator()(T X, T Y) { return HOST_SATURATE(HostOp); }                   \
   };
 
 DEFINE_HOST_BIN_OP(div_ieee, X / Y);
@@ -151,12 +158,12 @@ DEFINE_HOST_BIN_OP(pow, std::pow(X, Y));
   template <class T, int N> struct ESIMDf<T, N, MathOp::Op, AllVec> {          \
     esimd::simd<T, N>                                                          \
     operator()(esimd::simd<T, N> X) const SYCL_ESIMD_FUNCTION {                \
-      return esimd::Op<T, N>(X);                                               \
+      return esimd::Op<T, N>(X, ESIMD_SATURATION_TAG);                         \
     }                                                                          \
   };                                                                           \
   template <class T, int N> struct ESIMDf<T, N, MathOp::Op, AllSca> {          \
     esimd::simd<T, N> operator()(T X) const SYCL_ESIMD_FUNCTION {              \
-      return esimd::Op<T, N>(X);                                               \
+      return esimd::Op<T, N>(X, ESIMD_SATURATION_TAG);                         \
     }                                                                          \
   };
 
@@ -177,26 +184,26 @@ DEFINE_ESIMD_DEVICE_OP(log2);
 #define DEFINE_ESIMD_DEVICE_BIN_OP(Op)                                         \
   template <class T, int N> struct BinESIMDf<T, N, MathOp::Op, AllSca> {       \
     esimd::simd<T, N> operator()(T X, T Y) const SYCL_ESIMD_FUNCTION {         \
-      return esimd::Op<T, N>(X, Y);                                            \
+      return esimd::Op<T, N>(X, Y, ESIMD_SATURATION_TAG);                      \
     }                                                                          \
   };                                                                           \
   template <class T, int N> struct BinESIMDf<T, N, MathOp::Op, AllVec> {       \
     esimd::simd<T, N>                                                          \
     operator()(esimd::simd<T, N> X,                                            \
                esimd::simd<T, N> Y) const SYCL_ESIMD_FUNCTION {                \
-      return esimd::Op<T, N>(X, Y);                                            \
+      return esimd::Op<T, N>(X, Y, ESIMD_SATURATION_TAG);                      \
     }                                                                          \
   };                                                                           \
   template <class T, int N> struct BinESIMDf<T, N, MathOp::Op, Sca1Vec2> {     \
     esimd::simd<T, N>                                                          \
     operator()(T X, esimd::simd<T, N> Y) const SYCL_ESIMD_FUNCTION {           \
-      return esimd::Op<T, N>(X, Y);                                            \
+      return esimd::Op<T, N>(X, Y, ESIMD_SATURATION_TAG);                      \
     }                                                                          \
   };                                                                           \
   template <class T, int N> struct BinESIMDf<T, N, MathOp::Op, Sca2Vec1> {     \
     esimd::simd<T, N> operator()(esimd::simd<T, N> X,                          \
                                  T Y) const SYCL_ESIMD_FUNCTION {              \
-      return esimd::Op<T, N>(X, Y);                                            \
+      return esimd::Op<T, N>(X, Y, ESIMD_SATURATION_TAG);                      \
     }                                                                          \
   };
 
@@ -208,12 +215,12 @@ DEFINE_ESIMD_DEVICE_BIN_OP(pow);
     esimd::simd<T, N>                                                          \
     operator()(esimd::simd<T, N> X) const SYCL_ESIMD_FUNCTION {                \
       /* T must be float for SYCL, so not a template parameter for sycl::Op*/  \
-      return sycl::Op<N>(X);                                                   \
+      return ESIMD_SATURATE(T, sycl::Op<N>(X));                                \
     }                                                                          \
   };                                                                           \
   template <class T, int N> struct SYCLf<T, N, MathOp::Op, AllSca> {           \
     esimd::simd<T, N> operator()(T X) const SYCL_ESIMD_FUNCTION {              \
-      return sycl::Op<N>(X);                                                   \
+      return ESIMD_SATURATE(T, sycl::Op<N>(X));                                \
     }                                                                          \
   };
 
@@ -307,10 +314,11 @@ struct BinaryDeviceFunc {
 template <class T, int N, MathOp Op,
           template <class, int, MathOp, int> class Kernel,
           typename InitF = InitNarrow<T>>
-bool test(queue &Q, const std::string &Name,
-          InitF Init = InitNarrow<T>{}, float delta = 0.0f) {
+bool test(queue &Q, const std::string &Name, InitF Init = InitNarrow<T>{},
+          float delta = 0.0f) {
 
-  constexpr size_t Size = 1024 * 128;
+  constexpr size_t Size =
+      std::is_same_v<T, sycl::half> ? (16 * 128) : (1024 * 128);
   constexpr bool IsBinOp = (Op == MathOp::div_ieee) || (Op == MathOp::pow);
 
   T *A = new T[Size];
@@ -322,9 +330,9 @@ bool test(queue &Q, const std::string &Name,
     Init(A, B, Size);
   }
   const char *kind =
-    std::is_same_v<Kernel<T, N, Op, AllVec>, ESIMDf<T, N, Op, AllVec>>
-                         ? "ESIMD"
-                         : "SYCL";
+      std::is_same_v<Kernel<T, N, Op, AllVec>, ESIMDf<T, N, Op, AllVec>>
+          ? "ESIMD"
+          : "SYCL";
   std::cout << "  " << Name << " test, kind=" << kind << "...\n";
 
   try {
@@ -343,12 +351,11 @@ bool test(queue &Q, const std::string &Name,
       auto PC = BufC.template get_access<access::mode::write>(CGH);
       if constexpr (IsBinOp) {
         auto PB = BufB.template get_access<access::mode::read>(CGH);
-        BinaryDeviceFunc<T, N, Op, Kernel, decltype(PA), decltype(PC)> F(
-            PA, PB, PC);
+        BinaryDeviceFunc<T, N, Op, Kernel, decltype(PA), decltype(PC)> F(PA, PB,
+                                                                         PC);
         CGH.parallel_for(nd_range<1>{GlobalRange, LocalRange}, F);
       } else {
-        UnaryDeviceFunc<T, N, Op, Kernel, decltype(PA), decltype(PC)> F(PA,
-                                                                        PC);
+        UnaryDeviceFunc<T, N, Op, Kernel, decltype(PA), decltype(PC)> F(PA, PC);
         CGH.parallel_for(nd_range<1>{GlobalRange, LocalRange}, F);
       }
     });
@@ -384,6 +391,7 @@ bool test(queue &Q, const std::string &Name,
       if (++ErrCnt < 10) {
         std::cout << "    failed at index " << I << ", " << Test
                   << " != " << Gold << " (gold)\n";
+        std::cout << "A = " << (T)A[I] << ", B = " << (T)B[I] << "\n";
       }
     }
   }
@@ -442,10 +450,9 @@ template <class T, int N> bool testESIMDDivIEEE(queue &Q) {
 
 template <class T, int N> bool testESIMDPow(queue &Q) {
   bool Pass = true;
-  std::cout << "--- TESTING ESIMD pow, T=" << typeid(T).name()
-            << ", N = " << N << "...\n";
-  Pass &= test<T, N, MathOp::pow, BinESIMDf>(
-      Q, "pow", InitBin<T>{}, 0.1);
+  std::cout << "--- TESTING ESIMD pow, T=" << typeid(T).name() << ", N = " << N
+            << "...\n";
+  Pass &= test<T, N, MathOp::pow, BinESIMDf>(Q, "pow", InitBin<T>{}, 0.1);
   return Pass;
 }
 
@@ -479,7 +486,7 @@ int main(void) {
     Pass &= testESIMDSqrtIEEE<double, 32>(Q);
     Pass &= testESIMDDivIEEE<double, 32>(Q);
   }
-#else  // !TEST_IEEE_DIV_REM
+#else // !TEST_IEEE_DIV_REM
   Pass &= testESIMD<half, 8>(Q);
   Pass &= testESIMD<float, 16>(Q);
   Pass &= testESIMD<float, 32>(Q);
diff --git a/sycl/test-e2e/ESIMD/ext_math_saturate.cpp b/sycl/test-e2e/ESIMD/ext_math_saturate.cpp
@@ -0,0 +1,23 @@
+//==----------- ext_math_saturate.cpp  - DPC++ ESIMD extended math test ----==//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+// DEFINE: %{mathflags} = %if cl_options %{/clang:-fno-fast-math%} %else %{-fno-fast-math%}
+// RUN: %{build} -fsycl-device-code-split=per_kernel %{mathflags} -o %t.out
+// RUN: %{run} %t.out
+
+// FIXME: enable opaque pointers support
+// REQUIRES: TEMPORARY_DISABLED
+
+// This test checks extended math operations called with saturation.
+// Combinations of
+// - argument type - half, float
+// - math function - sin, cos, ..., div_ieee, pow
+// - SYCL vs ESIMD APIs
+
+#define SATURATION_ON
+
+#include "ext_math.cpp"