llvm-docs/doxygen/ompat_2math_8hpp_source.html

 /***************************************************************************

  *

  *  Copyright (C) Codeplay Software Ltd.

  *

  *  Part of the LLVM Project, under the Apache License v2.0 with LLVM

  *  Exceptions. See https://llvm.org/LICENSE.txt for license information.

  *  SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

  *

  *  Unless required by applicable law or agreed to in writing, software

  *  distributed under the License is distributed on an "AS IS" BASIS,

  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  *  See the License for the specific language governing permissions and

  *  limitations under the License.

  *

  *  SYCL compatibility extension

  *

  *  math.hpp

  *

  *  Description:

  *    math utilities for the SYCL compatibility extension.

  **************************************************************************/


 // The original source was under the license below:

 //==---- math.hpp ---------------------------------*- C++ -*----------------==//

 //

 // Copyright (C) Intel Corporation

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 // See https://llvm.org/LICENSE.txt for license information.

 //

 //===----------------------------------------------------------------------===//


 #pragma once


 #include <sycl/sycl.hpp>


 #ifndef SYCL_EXT_ONEAPI_COMPLEX

 #define SYCL_EXT_ONEAPI_COMPLEX

 #endif


 #include <sycl/ext/oneapi/experimental/complex/complex.hpp>


 namespace syclcompat {

 namespace detail {


 // Short alias for the namespace that hosts the experimental complex type.
 namespace complex_namespace = sycl::ext::oneapi::experimental;


 // Alias template naming the complex number type over ValueT that lives in
 // complex_namespace.
 template <typename ValueT>

 using complex_type = detail::complex_namespace::complex<ValueT>;


 /// Generic clamp helper: forwards to sycl::clamp with the arguments in the
 /// order (value, lower bound, upper bound).
 template <typename ValueT>
 inline ValueT clamp(ValueT val, ValueT min_val, ValueT max_val) {
   const ValueT clamped = sycl::clamp(val, min_val, max_val);
   return clamped;
 }


 #ifdef SYCL_EXT_ONEAPI_BFLOAT16_MATH_FUNCTIONS

 // TODO: Follow the process to add this to the extension. If added,

 // remove this functionality from the header.

 /// Explicit specialization of clamp for bfloat16, implemented with plain
 /// comparisons instead of sycl::clamp.
 template <>
 inline sycl::ext::oneapi::bfloat16 clamp(sycl::ext::oneapi::bfloat16 val,
                                          sycl::ext::oneapi::bfloat16 min_val,
                                          sycl::ext::oneapi::bfloat16 max_val) {
   // The lower bound is tested first, then the upper bound; a value that fails
   // both comparisons is returned unchanged.
   return (val < min_val) ? min_val : ((val > max_val) ? max_val : val);
 }

 #endif


 /// Function object that applies a binary operation element by element to two
 /// vectors of type VecT and returns the per-element results as a VecT.
 template <typename VecT, class BinaryOperation, class = void>
 class vectorized_binary {
 public:
   /// Calls binary_op(a[i], b[i]) for every index i of VecT.
   inline VecT operator()(VecT a, VecT b, const BinaryOperation binary_op) {
     VecT result;
     for (size_t lane = 0; lane < result.size(); ++lane)
       result[lane] = binary_op(a[lane], b[lane]);
     return result;
   }
 };


 /// Widens \p val to int64_t. For signed \p ValueT the result is sign-extended
 /// from bit position \p bit (bits at and above that position are replaced by
 /// copies of bit \p bit - 1); for unsigned \p ValueT the value is converted
 /// to int64_t as is.
 ///
 /// \param val Value to extend.
 /// \param bit Width in bits to sign-extend from; expected to be at least 1.
 ///            A width of 64 or more leaves the widened value untouched.
 /// \returns The extended value.
 template <typename ValueT>
 inline constexpr int64_t zero_or_signed_extent(ValueT val, unsigned bit) {
   if constexpr (std::is_signed_v<ValueT>) {
     // Nothing to truncate; also keeps the shift count below in range.
     if (bit >= 64)
       return static_cast<int64_t>(val);
     const unsigned shift = 64 - bit;
     // Shift left on the unsigned representation: left-shifting a negative
     // signed value is undefined behaviour before C++20.
     const uint64_t shifted =
         static_cast<uint64_t>(static_cast<int64_t>(val)) << shift;
     // The signed right shift then replicates the sign bit back down.
     return static_cast<int64_t>(shifted) >> shift;
   } else {
     return static_cast<int64_t>(val);
   }
 }


 /// Extends both operands with zero_or_signed_extent(…, 33), applies
 /// \p binary_op to the extended values and returns the result as RetT.
 /// When \p needSat is true the result is first clamped to the range of RetT.
 template <typename RetT, bool needSat, typename AT, typename BT,
           typename BinaryOperation>
 inline constexpr RetT extend_binary(AT a, BT b, BinaryOperation binary_op) {
   const int64_t lhs = zero_or_signed_extent(a, 33);
   const int64_t rhs = zero_or_signed_extent(b, 33);
   const int64_t raw = binary_op(lhs, rhs);
   if constexpr (!needSat) {
     return raw;
   } else {
     return detail::clamp<int64_t>(raw, std::numeric_limits<RetT>::min(),
                                   std::numeric_limits<RetT>::max());
   }
 }


 /// Two-stage variant: applies \p binary_op to the 33-bit-extended \p a and
 /// \p b, extends that intermediate result from 34 bits, optionally clamps it
 /// to the range of RetT (when \p needSat is true), and finally combines it
 /// with the 33-bit-extended \p c through \p second_op.
 template <typename RetT, bool needSat, typename AT, typename BT, typename CT,
           typename BinaryOperation1, typename BinaryOperation2>
 inline constexpr RetT extend_binary(AT a, BT b, CT c,
                                     BinaryOperation1 binary_op,
                                     BinaryOperation2 second_op) {
   const int64_t lhs = zero_or_signed_extent(a, 33);
   const int64_t rhs = zero_or_signed_extent(b, 33);
   int64_t first_stage = zero_or_signed_extent(binary_op(lhs, rhs), 34);
   if constexpr (needSat) {
     // Saturation applies to the first-stage result only.
     first_stage = detail::clamp<int64_t>(first_stage,
                                          std::numeric_limits<RetT>::min(),
                                          std::numeric_limits<RetT>::max());
   }
   const int64_t third = zero_or_signed_extent(c, 33);
   return second_op(first_stage, third);
 }


 /// Scalar NaN test; forwards to sycl::isnan and returns the result as bool.
 template <typename ValueT> inline bool isnan(const ValueT a) {
   const bool is_nan = sycl::isnan(a);
   return is_nan;
 }

 #ifdef SYCL_EXT_ONEAPI_BFLOAT16_MATH_FUNCTIONS

 /// bfloat16 overload of isnan; forwards to the experimental oneAPI isnan.
 inline bool isnan(const sycl::ext::oneapi::bfloat16 a) {
   const bool is_nan = sycl::ext::oneapi::experimental::isnan(a);
   return is_nan;
 }

 #endif


 } // namespace detail


 /// Compute fast_length for variable-length array.
 ///
 /// Lengths 1 to 4 are delegated to sycl::fast_length on a scalar or a
 /// float2/float3/float4 built from the first elements; a length of 0 yields
 /// 0; any other length accumulates the sum of squares and returns its
 /// sycl::sqrt.
 ///
 /// \param a Pointer to the first element.
 /// \param len Number of elements to read from \p a.
 inline float fast_length(const float *a, int len) {
   if (len == 0)
     return 0;
   if (len == 1)
     return sycl::fast_length(a[0]);
   if (len == 2)
     return sycl::fast_length(sycl::float2(a[0], a[1]));
   if (len == 3)
     return sycl::fast_length(sycl::float3(a[0], a[1], a[2]));
   if (len == 4)
     return sycl::fast_length(sycl::float4(a[0], a[1], a[2], a[3]));

   // General case (a non-positive len never enters the loop).
   float sum_of_squares = 0;
   for (int idx = 0; idx < len; ++idx)
     sum_of_squares += a[idx] * a[idx];
   return sycl::sqrt(sum_of_squares);
 }


 /// Calculates the length of the input array, i.e. the square root of the sum
 /// of the squares of its elements.
 ///
 /// Lengths 1 to 4 are delegated to sycl::length; every other length is
 /// handled by accumulating the sum of squares and taking sycl::sqrt.
 ///
 /// \param a Pointer to the first element.
 /// \param len Number of elements to read from \p a.
 /// \returns The computed length.
 template <typename ValueT>
 inline ValueT length(const ValueT *a, const int len) {
   switch (len) {
   case 1:
     // The length of a single element is its magnitude, not the raw (possibly
     // negative) value; this mirrors the scalar case of fast_length.
     return sycl::length(a[0]);
   case 2:
     return sycl::length(sycl::vec<ValueT, 2>(a[0], a[1]));
   case 3:
     return sycl::length(sycl::vec<ValueT, 3>(a[0], a[1], a[2]));
   case 4:
     return sycl::length(sycl::vec<ValueT, 4>(a[0], a[1], a[2], a[3]));
   default: {
     // A non-positive len never enters the loop and yields sqrt(0).
     ValueT ret = 0;
     for (int i = 0; i < len; ++i)
       ret += a[i] * a[i];
     return sycl::sqrt(ret);
   }
   }
 }


 /// Performs comparison.
 ///
 /// Participates in overload resolution only when \p binary_op applied to two
 /// ValueT arguments yields exactly bool.
 ///
 /// \returns The result of binary_op(a, b).
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<
     std::is_same_v<std::invoke_result_t<BinaryOperation, ValueT, ValueT>, bool>,
     bool>
 compare(const ValueT a, const ValueT b, const BinaryOperation binary_op) {
   const bool outcome = binary_op(a, b);
   return outcome;
 }

 /// Overload of compare for std::not_equal_to<>: if either operand is NaN the
 /// result is false, otherwise it is binary_op(a, b).
 template <typename ValueT>
 inline std::enable_if_t<
     std::is_same_v<std::invoke_result_t<std::not_equal_to<>, ValueT, ValueT>,
                    bool>,
     bool>
 compare(const ValueT a, const ValueT b, const std::not_equal_to<> binary_op) {
   if (detail::isnan(a) || detail::isnan(b))
     return false;
   return binary_op(a, b);
 }


 /// Two-element overload of compare: compares element 0 and element 1
 /// separately and returns both results packed into a ValueT.
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<ValueT::size() == 2, ValueT>
 compare(const ValueT a, const ValueT b, const BinaryOperation binary_op) {
   const auto first = compare(a[0], b[0], binary_op);
   const auto second = compare(a[1], b[1], binary_op);
   return {first, second};
 }


 /// Performs unordered comparison: the result is true when either operand is
 /// NaN, otherwise it is binary_op(a, b).
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<
     std::is_same_v<std::invoke_result_t<BinaryOperation, ValueT, ValueT>, bool>,
     bool>
 unordered_compare(const ValueT a, const ValueT b,
                   const BinaryOperation binary_op) {
   if (detail::isnan(a))
     return true;
   if (detail::isnan(b))
     return true;
   return binary_op(a, b);
 }


 /// Two-element overload of unordered_compare: compares element 0 and
 /// element 1 separately and returns both results packed into a ValueT.
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<ValueT::size() == 2, ValueT>
 unordered_compare(const ValueT a, const ValueT b,
                   const BinaryOperation binary_op) {
   const auto first = unordered_compare(a[0], b[0], binary_op);
   const auto second = unordered_compare(a[1], b[1], binary_op);
   return {first, second};
 }


 /// Performs 2 element comparison and returns true if both results are true.
 /// The second element is only compared when the first comparison succeeds.
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<ValueT::size() == 2, bool>
 compare_both(const ValueT a, const ValueT b, const BinaryOperation binary_op) {
   if (!compare(a[0], b[0], binary_op))
     return false;
   return compare(a[1], b[1], binary_op);
 }


 /// Performs 2 element unordered comparison and returns true if both results
 /// are true. The second element is only compared when the first comparison
 /// succeeds.
 template <typename ValueT, class BinaryOperation>
 inline std::enable_if_t<ValueT::size() == 2, bool>
 unordered_compare_both(const ValueT a, const ValueT b,
                        const BinaryOperation binary_op) {
   if (!unordered_compare(a[0], b[0], binary_op))
     return false;
   return unordered_compare(a[1], b[1], binary_op);
 }


 /// Performs 2 elements comparison; the compare result of each element is
 /// 0 (false) or 0xffff (true), and the two results are packed into one
 /// unsigned value.
 ///
 /// \returns The result for element 0 in the upper 16 bits and the result for
 ///          element 1 in the lower 16 bits.
 template <typename ValueT, class BinaryOperation>
 inline unsigned compare_mask(const sycl::vec<ValueT, 2> a,
                              const sycl::vec<ValueT, 2> b,
                              const BinaryOperation binary_op) {
   // Select the masks from unsigned constants rather than negating the bool
   // and shifting: left-shifting -1 is undefined behaviour before C++20.
   const unsigned high = compare(a[0], b[0], binary_op) ? 0xFFFF0000u : 0u;
   const unsigned low = compare(a[1], b[1], binary_op) ? 0x0000FFFFu : 0u;
   return high | low;
 }


 /// Performs 2 elements unordered comparison; the compare result of each
 /// element is 0 (false) or 0xffff (true), and the two results are packed
 /// into one unsigned value.
 ///
 /// \returns The result for element 0 in the upper 16 bits and the result for
 ///          element 1 in the lower 16 bits.
 template <typename ValueT, class BinaryOperation>
 inline unsigned unordered_compare_mask(const sycl::vec<ValueT, 2> a,
                                        const sycl::vec<ValueT, 2> b,
                                        const BinaryOperation binary_op) {
   // Select the masks from unsigned constants rather than negating the bool
   // and shifting: left-shifting -1 is undefined behaviour before C++20.
   const unsigned high =
       unordered_compare(a[0], b[0], binary_op) ? 0xFFFF0000u : 0u;
   const unsigned low =
       unordered_compare(a[1], b[1], binary_op) ? 0x0000FFFFu : 0u;
   return high | low;
 }


 template <typename S, typename T> inline T vectorized_max(T a, T b) {

   sycl::vec<T, 1> v0{a}, v1{b};

   auto v2 = v0.template as<S>();

   auto v3 = v1.template as<S>();

   v2 = sycl::max(v2, v3);

   v0 = v2.template as<sycl::vec<T, 1>>();

   return v0;

 }


 template <typename S, typename T> inline T vectorized_min(T a, T b) {

   sycl::vec<T, 1> v0{a}, v1{b};

   auto v2 = v0.template as<S>();

   auto v3 = v1.template as<S>();

   v2 = sycl::min(v2, v3);

   v0 = v2.template as<sycl::vec<T, 1>>();

   return v0;

 }


 template <typename VecT, class UnaryOperation>

 inline unsigned vectorized_unary(unsigned a, const UnaryOperation unary_op) {

   sycl::vec<unsigned, 1> v0{a};

   auto v1 = v0.as<VecT>();

   auto v2 = unary_op(v1);

   v0 = v2.template as<sycl::vec<unsigned, 1>>();

   return v0;

 }


 template <typename VecT>

 inline unsigned vectorized_sum_abs_diff(unsigned a, unsigned b) {

   sycl::vec<unsigned, 1> v0{a}, v1{b};

   auto v2 = v0.as<VecT>();

   auto v3 = v1.as<VecT>();

   auto v4 = sycl::abs_diff(v2, v3);

   unsigned sum = 0;

   for (size_t i = 0; i < v4.size(); ++i) {

     sum += v4[i];

   }

   return sum;

 }


 template <typename S, typename T> inline T vectorized_isgreater(T a, T b) {

   sycl::vec<T, 1> v0{a}, v1{b};

   auto v2 = v0.template as<S>();

   auto v3 = v1.template as<S>();

   auto v4 = sycl::isgreater(v2, v3);

   v0 = v4.template as<sycl::vec<T, 1>>();

   return v0;

 }


 /// Specialization of vectorized_isgreater for two ushort lanes packed in an
 /// unsigned: each lane of the result holds the value of the built-in `>`
 /// comparison of the corresponding lanes.
 template <>
 inline unsigned vectorized_isgreater<sycl::ushort2, unsigned>(unsigned a,
                                                               unsigned b) {
   sycl::vec<unsigned, 1> packed_a{a};
   sycl::vec<unsigned, 1> packed_b{b};
   auto lanes_a = packed_a.template as<sycl::ushort2>();
   auto lanes_b = packed_b.template as<sycl::ushort2>();
   sycl::ushort2 greater;
   greater[0] = lanes_a[0] > lanes_b[0];
   greater[1] = lanes_a[1] > lanes_b[1];
   packed_a = greater.template as<sycl::vec<unsigned, 1>>();
   return packed_a;
 }


 /// Public clamp entry point; forwards to detail::clamp with the arguments in
 /// the order (value, lower bound, upper bound).
 template <typename ValueT>
 inline ValueT clamp(ValueT val, ValueT min_val, ValueT max_val) {
   const ValueT clamped = detail::clamp(val, min_val, max_val);
   return clamped;
 }


 /// Determine whether 2 element value is NaN; each element is tested with
 /// detail::isnan and the two results are packed into a ValueT.
 template <typename ValueT>
 inline std::enable_if_t<ValueT::size() == 2, ValueT> isnan(const ValueT a) {
   const bool first_is_nan = detail::isnan(a[0]);
   const bool second_is_nan = detail::isnan(a[1]);
   return {first_is_nan, second_is_nan};
 }


 /// cbrt function wrapper; enabled for standard floating-point types and
 /// sycl::half, and forwards to sycl::cbrt.
 template <typename ValueT>
 inline std::enable_if_t<std::is_floating_point_v<ValueT> ||
                             std::is_same_v<sycl::half, ValueT>,
                         ValueT>
 cbrt(ValueT val) {
   // val already has type ValueT, so it is passed through without a cast.
   return sycl::cbrt(val);
 }


 // min/max function overloads.

 // For floating-point types, `float` or `double` arguments are acceptable.

 // For integer types, `std::uint32_t`, `std::int32_t`, `std::uint64_t` or

 // `std::int64_t` type arguments are acceptable.

 // sycl::half supported as well.

 /// Integral min: converts both arguments to their common type and forwards
 /// to sycl::min.
 template <typename ValueT, typename ValueU>
 std::enable_if_t<std::is_integral_v<ValueT> && std::is_integral_v<ValueU>,
                  std::common_type_t<ValueT, ValueU>>
 min(ValueT a, ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const CommonT lhs = static_cast<CommonT>(a);
   const CommonT rhs = static_cast<CommonT>(b);
   return sycl::min(lhs, rhs);
 }

 /// Floating-point min: converts both arguments to their common type and
 /// forwards to sycl::fmin.
 template <typename ValueT, typename ValueU>
 std::enable_if_t<std::is_floating_point_v<ValueT> &&
                      std::is_floating_point_v<ValueU>,
                  std::common_type_t<ValueT, ValueU>>
 min(ValueT a, ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const CommonT lhs = static_cast<CommonT>(a);
   const CommonT rhs = static_cast<CommonT>(b);
   return sycl::fmin(lhs, rhs);
 }

 /// sycl::half overload of min; forwards to sycl::fmin.
 /// Declared inline because this non-template function is defined in a
 /// header and would otherwise be defined once per including translation unit.
 inline sycl::half min(sycl::half a, sycl::half b) { return sycl::fmin(a, b); }


 /// Integral max: converts both arguments to their common type and forwards
 /// to sycl::max.
 template <typename ValueT, typename ValueU>
 std::enable_if_t<std::is_integral_v<ValueT> && std::is_integral_v<ValueU>,
                  std::common_type_t<ValueT, ValueU>>
 max(ValueT a, ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const CommonT lhs = static_cast<CommonT>(a);
   const CommonT rhs = static_cast<CommonT>(b);
   return sycl::max(lhs, rhs);
 }

 /// Floating-point max: converts both arguments to their common type and
 /// forwards to sycl::fmax.
 template <typename ValueT, typename ValueU>
 std::enable_if_t<std::is_floating_point_v<ValueT> &&
                      std::is_floating_point_v<ValueU>,
                  std::common_type_t<ValueT, ValueU>>
 max(ValueT a, ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const CommonT lhs = static_cast<CommonT>(a);
   const CommonT rhs = static_cast<CommonT>(b);
   return sycl::fmax(lhs, rhs);
 }

 /// sycl::half overload of max; forwards to sycl::fmax.
 /// Declared inline because this non-template function is defined in a
 /// header and would otherwise be defined once per including translation unit.
 inline sycl::half max(sycl::half a, sycl::half b) { return sycl::fmax(a, b); }


 /// Performs 2 elements comparison and returns the bigger one. If either
 /// argument is NaN, NAN is returned; otherwise both arguments are converted
 /// to their common type and passed to sycl::fmax.
 template <typename ValueT, typename ValueU>
 inline std::common_type_t<ValueT, ValueU> fmax_nan(const ValueT a,
                                                    const ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const bool any_nan = detail::isnan(a) || detail::isnan(b);
   if (any_nan)
     return NAN;
   return sycl::fmax(static_cast<CommonT>(a), static_cast<CommonT>(b));
 }

 /// Two-element overload of fmax_nan: applies the scalar fmax_nan to element
 /// 0 and to element 1 and returns both results as a vector.
 template <typename ValueT, typename ValueU>
 inline sycl::vec<std::common_type_t<ValueT, ValueU>, 2>
 fmax_nan(const sycl::vec<ValueT, 2> a, const sycl::vec<ValueU, 2> b) {
   const auto first = fmax_nan(a[0], b[0]);
   const auto second = fmax_nan(a[1], b[1]);
   return {first, second};
 }


 /// Performs 2 elements comparison and returns the smaller one. If either
 /// argument is NaN, NAN is returned; otherwise both arguments are converted
 /// to their common type and passed to sycl::fmin.
 template <typename ValueT, typename ValueU>
 inline std::common_type_t<ValueT, ValueU> fmin_nan(const ValueT a,
                                                    const ValueU b) {
   using CommonT = std::common_type_t<ValueT, ValueU>;
   const bool any_nan = detail::isnan(a) || detail::isnan(b);
   if (any_nan)
     return NAN;
   return sycl::fmin(static_cast<CommonT>(a), static_cast<CommonT>(b));
 }

 /// Two-element overload of fmin_nan: applies the scalar fmin_nan to element
 /// 0 and to element 1 and returns both results as a vector.
 template <typename ValueT, typename ValueU>
 inline sycl::vec<std::common_type_t<ValueT, ValueU>, 2>
 fmin_nan(const sycl::vec<ValueT, 2> a, const sycl::vec<ValueU, 2> b) {
   const auto first = fmin_nan(a[0], b[0]);
   const auto second = fmin_nan(a[1], b[1]);
   return {first, second};
 }


 // pow functions overload.

 /// float base with int exponent; forwards to sycl::pown.
 inline float pow(const float a, const int b) {
   const float powered = sycl::pown(a, b);
   return powered;
 }

 /// double base with int exponent; forwards to sycl::pown.
 inline double pow(const double a, const int b) {
   const double powered = sycl::pown(a, b);
   return powered;
 }


 /// Floating-point base: the exponent is converted to the base type ValueT
 /// and both are passed to sycl::pow.
 template <typename ValueT, typename ValueU>
 inline typename std::enable_if_t<std::is_floating_point_v<ValueT>, ValueT>
 pow(const ValueT a, const ValueU b) {
   const ValueT exponent = static_cast<ValueT>(b);
   return sycl::pow(a, exponent);
 }


 // TODO: calling pow with non-floating point values is currently defaulting to

 // double, which fails on devices without aspect::fp64. This has to be properly

 // documented, and maybe changed to support all devices.

 /// Non-floating-point base: both arguments are converted to double and
 /// passed to sycl::pow, so the result is always double.
 template <typename ValueT, typename ValueU>
 inline typename std::enable_if_t<!std::is_floating_point_v<ValueT>, double>
 pow(const ValueT a, const ValueU b) {
   const double base = static_cast<double>(a);
   const double exponent = static_cast<double>(b);
   return sycl::pow(base, exponent);
 }


 /// Performs relu saturation: a non-NaN value below zero becomes zero; every
 /// other value (including NaN) is returned unchanged.
 template <typename ValueT>
 inline std::enable_if_t<std::is_floating_point_v<ValueT> ||
                             std::is_same_v<sycl::half, ValueT>,
                         ValueT>
 relu(const ValueT a) {
   const bool is_negative = !detail::isnan(a) && a < ValueT(0);
   if (is_negative)
     return ValueT(0);
   return a;
 }

 /// Two-element sycl::vec overload of relu: applies the scalar relu to each
 /// element.
 template <class ValueT>
 inline std::enable_if_t<std::is_floating_point_v<ValueT> ||
                             std::is_same_v<sycl::half, ValueT>,
                         sycl::vec<ValueT, 2>>
 relu(const sycl::vec<ValueT, 2> a) {
   const auto first = relu(a[0]);
   const auto second = relu(a[1]);
   return {first, second};
 }

 /// Two-element sycl::marray overload of relu: applies the scalar relu to
 /// each element.
 template <class ValueT>
 inline std::enable_if_t<std::is_floating_point_v<ValueT> ||
                             std::is_same_v<sycl::half, ValueT>,
                         sycl::marray<ValueT, 2>>
 relu(const sycl::marray<ValueT, 2> a) {
   const auto first = relu(a[0]);
   const auto second = relu(a[1]);
   return {first, second};
 }


 /// Computes the multiplication of two complex numbers, each given as a
 /// two-element vector holding (real, imaginary).
 template <typename T>
 sycl::vec<T, 2> cmul(sycl::vec<T, 2> x, sycl::vec<T, 2> y) {
   sycl::ext::oneapi::experimental::complex<T> lhs(x[0], x[1]);
   sycl::ext::oneapi::experimental::complex<T> rhs(y[0], y[1]);
   lhs = lhs * rhs;
   return sycl::vec<T, 2>(lhs.real(), lhs.imag());
 }


 /// Computes the division of two complex numbers, each given as a
 /// two-element vector holding (real, imaginary).
 template <typename T>
 sycl::vec<T, 2> cdiv(sycl::vec<T, 2> x, sycl::vec<T, 2> y) {
   sycl::ext::oneapi::experimental::complex<T> numerator(x[0], x[1]);
   sycl::ext::oneapi::experimental::complex<T> denominator(y[0], y[1]);
   numerator = numerator / denominator;
   return sycl::vec<T, 2>(numerator.real(), numerator.imag());
 }


 /// Computes the magnitude of a complex number given as a two-element vector
 /// holding (real, imaginary).
 template <typename T> T cabs(sycl::vec<T, 2> x) {
   sycl::ext::oneapi::experimental::complex<T> value(x[0], x[1]);
   return sycl::ext::oneapi::experimental::abs(value);
 }


 /// Computes the complex conjugate of a complex number given as a
 /// two-element vector holding (real, imaginary).
 template <typename T> sycl::vec<T, 2> conj(sycl::vec<T, 2> x) {
   sycl::ext::oneapi::experimental::complex<T> value(x[0], x[1]);
   // Unqualified call on a complex argument (not on a sycl::vec).
   value = conj(value);
   return sycl::vec<T, 2>(value.real(), value.imag());
 }


 /// Performs complex number multiply addition, a * b + c, with each operand
 /// given as a two-element sycl::vec holding (real, imaginary).
 template <typename ValueT>
 inline sycl::vec<ValueT, 2> cmul_add(const sycl::vec<ValueT, 2> a,
                                      const sycl::vec<ValueT, 2> b,
                                      const sycl::vec<ValueT, 2> c) {
   sycl::ext::oneapi::experimental::complex<ValueT> multiplicand(a[0], a[1]);
   sycl::ext::oneapi::experimental::complex<ValueT> multiplier(b[0], b[1]);
   sycl::ext::oneapi::experimental::complex<ValueT> addend(c[0], c[1]);
   multiplicand = multiplicand * multiplier + addend;
   return sycl::vec<ValueT, 2>{multiplicand.real(), multiplicand.imag()};
 }

 /// Performs complex number multiply addition, a * b + c, with each operand
 /// given as a two-element sycl::marray holding (real, imaginary).
 template <typename ValueT>
 inline sycl::marray<ValueT, 2> cmul_add(const sycl::marray<ValueT, 2> a,
                                         const sycl::marray<ValueT, 2> b,
                                         const sycl::marray<ValueT, 2> c) {
   sycl::ext::oneapi::experimental::complex<ValueT> multiplicand(a[0], a[1]);
   sycl::ext::oneapi::experimental::complex<ValueT> multiplier(b[0], b[1]);
   sycl::ext::oneapi::experimental::complex<ValueT> addend(c[0], c[1]);
   multiplicand = multiplicand * multiplier + addend;
   return sycl::marray<ValueT, 2>{multiplicand.real(), multiplicand.imag()};
 }


 /// A sycl::abs wrapper functor.
 struct abs {
   /// Returns sycl::abs(x).
   template <class ValueT> auto operator()(const ValueT x) const {
     auto magnitude = sycl::abs(x);
     return magnitude;
   }
 };


 /// A sycl::abs_diff wrapper functor.
 struct abs_diff {
   /// Returns sycl::abs_diff(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto difference = sycl::abs_diff(x, y);
     return difference;
   }
 };


 /// A sycl::add_sat wrapper functor.
 struct add_sat {
   /// Returns sycl::add_sat(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto sum = sycl::add_sat(x, y);
     return sum;
   }
 };


 /// A sycl::rhadd wrapper functor.
 struct rhadd {
   /// Returns sycl::rhadd(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto result = sycl::rhadd(x, y);
     return result;
   }
 };


 /// A sycl::hadd wrapper functor.
 struct hadd {
   /// Returns sycl::hadd(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto result = sycl::hadd(x, y);
     return result;
   }
 };


 /// A sycl::max wrapper functor.
 struct maximum {
   /// Returns sycl::max(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto larger = sycl::max(x, y);
     return larger;
   }
 };


 /// A sycl::min wrapper functor.
 struct minimum {
   /// Returns sycl::min(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto smaller = sycl::min(x, y);
     return smaller;
   }
 };


 /// A sycl::sub_sat wrapper functor.
 struct sub_sat {
   /// Returns sycl::sub_sat(x, y).
   template <class ValueT>
   auto operator()(const ValueT x, const ValueT y) const {
     auto difference = sycl::sub_sat(x, y);
     return difference;
   }
 };


 template <typename VecT, class BinaryOperation>

 inline unsigned vectorized_binary(unsigned a, unsigned b,

                                   const BinaryOperation binary_op) {

   sycl::vec<unsigned, 1> v0{a}, v1{b};

   auto v2 = v0.as<VecT>();

   auto v3 = v1.as<VecT>();

   auto v4 =

       detail::vectorized_binary<VecT, BinaryOperation>()(v2, v3, binary_op);

   v0 = v4.template as<sycl::vec<unsigned, 1>>();

   return v0;

 }


 /// Extend a and b to 33 bit and add them.
 template <typename RetT, typename AT, typename BT>
 inline constexpr RetT extend_add(AT a, BT b) {
   constexpr bool saturate = false;
   return detail::extend_binary<RetT, saturate>(a, b, std::plus<>{});
 }


 /// Three-operand form of extend_add: delegates to detail::extend_binary with
 /// std::plus as the first operation and \p second_op as the operation that
 /// combines the intermediate result with \p c. No saturation.
 template <typename RetT, typename AT, typename BT, typename CT,
           typename BinaryOperation>
 inline constexpr RetT extend_add(AT a, BT b, CT c, BinaryOperation second_op) {
   constexpr bool saturate = false;
   return detail::extend_binary<RetT, saturate>(a, b, c, std::plus<>{},
                                                second_op);
 }


 /// Extend a and b to 33 bit and add them with saturation.
 template <typename RetT, typename AT, typename BT>
 inline constexpr RetT extend_add_sat(AT a, BT b) {
   constexpr bool saturate = true;
   return detail::extend_binary<RetT, saturate>(a, b, std::plus<>{});
 }


 /// Three-operand form of extend_add_sat: delegates to detail::extend_binary
 /// with std::plus as the first operation, saturation enabled, and
 /// \p second_op as the operation that combines the intermediate result with
 /// \p c.
 template <typename RetT, typename AT, typename BT, typename CT,
           typename BinaryOperation>
 inline constexpr RetT extend_add_sat(AT a, BT b, CT c,
                                      BinaryOperation second_op) {
   constexpr bool saturate = true;
   return detail::extend_binary<RetT, saturate>(a, b, c, std::plus<>{},
                                                second_op);
 }


 /// Extend a and b to 33 bit and subtract b from a.
 template <typename RetT, typename AT, typename BT>
 inline constexpr RetT extend_sub(AT a, BT b) {
   constexpr bool saturate = false;
   return detail::extend_binary<RetT, saturate>(a, b, std::minus<>{});
 }


 /// Three-operand form of extend_sub: delegates to detail::extend_binary with
 /// std::minus as the first operation and \p second_op as the operation that
 /// combines the intermediate result with \p c. No saturation.
 template <typename RetT, typename AT, typename BT, typename CT,
           typename BinaryOperation>
 inline constexpr RetT extend_sub(AT a, BT b, CT c, BinaryOperation second_op) {
   constexpr bool saturate = false;
   return detail::extend_binary<RetT, saturate>(a, b, c, std::minus<>{},
                                                second_op);
 }


 /// Extend a and b to 33 bit and subtract b from a with saturation.
 template <typename RetT, typename AT, typename BT>
 inline constexpr RetT extend_sub_sat(AT a, BT b) {
   constexpr bool saturate = true;
   return detail::extend_binary<RetT, saturate>(a, b, std::minus<>{});
 }


 /// Three-operand form of extend_sub_sat: delegates to detail::extend_binary
 /// with std::minus as the first operation, saturation enabled, and
 /// \p second_op as the operation that combines the intermediate result with
 /// \p c.
 template <typename RetT, typename AT, typename BT, typename CT,
           typename BinaryOperation>
 inline constexpr RetT extend_sub_sat(AT a, BT b, CT c,
                                      BinaryOperation second_op) {
   constexpr bool saturate = true;
   return detail::extend_binary<RetT, saturate>(a, b, c, std::minus<>{},
                                                second_op);
 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_absdiff(AT a, BT b) {

   return detail::extend_binary<RetT, false>(a, b, abs_diff());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_absdiff(AT a, BT b, CT c,

                                      BinaryOperation second_op) {

   return detail::extend_binary<RetT, false>(a, b, c, abs_diff(), second_op);

 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_absdiff_sat(AT a, BT b) {

   return detail::extend_binary<RetT, true>(a, b, abs_diff());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_absdiff_sat(AT a, BT b, CT c,

                                          BinaryOperation second_op) {

   return detail::extend_binary<RetT, true>(a, b, c, abs_diff(), second_op);

 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_min(AT a, BT b) {

   return detail::extend_binary<RetT, false>(a, b, minimum());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_min(AT a, BT b, CT c, BinaryOperation second_op) {

   return detail::extend_binary<RetT, false>(a, b, c, minimum(), second_op);

 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_min_sat(AT a, BT b) {

   return detail::extend_binary<RetT, true>(a, b, minimum());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_min_sat(AT a, BT b, CT c,

                                      BinaryOperation second_op) {

   return detail::extend_binary<RetT, true>(a, b, c, minimum(), second_op);

 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_max(AT a, BT b) {

   return detail::extend_binary<RetT, false>(a, b, maximum());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_max(AT a, BT b, CT c, BinaryOperation second_op) {

   return detail::extend_binary<RetT, false>(a, b, c, maximum(), second_op);

 }


 template <typename RetT, typename AT, typename BT>

 inline constexpr RetT extend_max_sat(AT a, BT b) {

   return detail::extend_binary<RetT, true>(a, b, maximum());

 }


 template <typename RetT, typename AT, typename BT, typename CT,

           typename BinaryOperation>

 inline constexpr RetT extend_max_sat(AT a, BT b, CT c,

                                      BinaryOperation second_op) {

   return detail::extend_binary<RetT, true>(a, b, c, maximum(), second_op);

 }


 } // namespace syclcompat

sycl::_V1::detail::half_impl::half
Definition: half_type.hpp:276

sycl::_V1::ext::oneapi::bfloat16
Definition: bfloat16.hpp:51

sycl::_V1::ext::oneapi::experimental::complex
Definition: common.hpp:28

sycl::marray
Provides a cross-platform math array class template that works on SYCL devices as well as in host C++...
Definition: marray.hpp:49

sycl::vec
class sycl::vec: Provides a cross-platform vector class template that works e...
Definition: vector_preview.hpp:361

syclcompat::detail::vectorized_binary
Definition: math.hpp:71

syclcompat::detail::vectorized_binary::operator()
VecT operator()(VecT a, VecT b, const BinaryOperation binary_op)
Definition: math.hpp:73

complex.hpp

sycl::_V1::ext::intel::esimd::abs
__ESIMD_API std::enable_if_t< detail::is_esimd_scalar< T1 >::value, std::remove_const_t< T1 > > abs(T1 src0)
Get absolute value (scalar version).
Definition: math.hpp:166

sycl::_V1::detail::int64_t
conditional< sizeof(long)==8, long, long long >::type int64_t
Definition: kernel_desc.hpp:35

sycl::_V1::ext::intel::esimd::detail::sum
ESIMD_INLINE ESIMD_NODEBUG T0 sum(simd< T1, SZ > v)
Definition: math.hpp:1009

sycl::_V1::ext::intel::math::sqrt
std::enable_if_t< std::is_same_v< Tp, sycl::half2 >, sycl::half2 > sqrt(Tp x)
Definition: math.hpp:194

sycl::_V1::ext::oneapi::plus
std::plus< T > plus
Definition: functional.hpp:20

sycl::_V1::ext::oneapi::minimum
sycl::minimum< T > minimum
Definition: functional.hpp:26

sycl::_V1::ext::oneapi::maximum
sycl::maximum< T > maximum
Definition: functional.hpp:25

sycl::_V1::min
min
Definition: common_functions.cpp:63

sycl::_V1::hadd
return std::max(x, y) - std hadd
Definition: integer_functions.cpp:119

sycl::_V1::clamp
clamp
Definition: integer_functions.cpp:218

sycl::_V1::abs_diff
abs_diff
Definition: integer_functions.cpp:92

sycl::_V1::max
max
Definition: integer_functions.cpp:212

sycl::_V1::t
auto t
Definition: common_functions.cpp:57

syclcompat::detail::isnan
bool isnan(const ValueT a)
Definition: math.hpp:121

syclcompat::detail::clamp
ValueT clamp(ValueT val, ValueT min_val, ValueT max_val)
Definition: math.hpp:51

syclcompat::detail::complex_type
detail::complex_namespace::complex< ValueT > complex_type
Definition: math.hpp:48

syclcompat::detail::zero_or_signed_extent
int64_t zero_or_signed_extent(ValueT val, unsigned bit)
Extend the 'val' to 'bit' size, zero extend for unsigned int and signed extend for signed int.
Definition: math.hpp:85

syclcompat::detail::extend_binary
constexpr RetT extend_binary(AT a, BT b, BinaryOperation binary_op)
Definition: math.hpp:94

syclcompat
Definition: atomic.hpp:43

syclcompat::pow
float pow(const float a, const int b)
Definition: math.hpp:499

syclcompat::extend_absdiff_sat
constexpr RetT extend_absdiff_sat(AT a, BT b)
Extend a and b to 33 bit and do abs_diff with saturation.
Definition: math.hpp:856

syclcompat::min
sycl::half min(sycl::half a, sycl::half b)
Definition: math.hpp:441

syclcompat::extend_add
constexpr RetT extend_add(AT a, BT b)
Extend a and b to 33 bit and add them.
Definition: math.hpp:703

syclcompat::vectorized_max
T vectorized_max(T a, T b)
Compute vectorized max for two values, with each value treated as a vector type S.
Definition: math.hpp:301

syclcompat::compare
std::enable_if_t< std::is_same_v< std::invoke_result_t< BinaryOperation, ValueT, ValueT >, bool >, bool > compare(const ValueT a, const ValueT b, const BinaryOperation binary_op)
Performs comparison.
Definition: math.hpp:188

syclcompat::extend_sub
constexpr RetT extend_sub(AT a, BT b)
Extend a and b to 33 bits and subtract b from a.
Definition: math.hpp:764

syclcompat::extend_max_sat
constexpr RetT extend_max_sat(AT a, BT b)
Extend a and b to 33 bit and return bigger one with saturation.
Definition: math.hpp:980

syclcompat::fast_length
float fast_length(const float *a, int len)
Compute fast_length for variable-length array.
Definition: math.hpp:136

syclcompat::extend_add_sat
constexpr RetT extend_add_sat(AT a, BT b)
Extend a and b to 33 bit and add them with saturation.
Definition: math.hpp:732

syclcompat::cabs
T cabs(sycl::vec< T, 2 > x)
Computes the magnitude of a complex number.
Definition: math.hpp:572

syclcompat::max
sycl::half max(sycl::half a, sycl::half b)
Definition: math.hpp:458

syclcompat::extend_min
constexpr RetT extend_min(AT a, BT b)
Extend a and b to 33 bit and return smaller one.
Definition: math.hpp:888

syclcompat::max
std::enable_if_t< std::is_integral_v< ValueT > &&std::is_integral_v< ValueU >, std::common_type_t< ValueT, ValueU > > max(ValueT a, ValueU b)
Definition: math.hpp:446

syclcompat::extend_max
constexpr RetT extend_max(AT a, BT b)
Extend a and b to 33 bit and return bigger one.
Definition: math.hpp:950

syclcompat::fmax_nan
std::common_type_t< ValueT, ValueU > fmax_nan(const ValueT a, const ValueU b)
Performs 2 elements comparison and returns the bigger one.
Definition: math.hpp:466

syclcompat::extend_absdiff
constexpr RetT extend_absdiff(AT a, BT b)
Extend a and b to 33 bit and do abs_diff.
Definition: math.hpp:825

syclcompat::extend_min_sat
constexpr RetT extend_min_sat(AT a, BT b)
Extend a and b to 33 bit and return smaller one with saturation.
Definition: math.hpp:918

syclcompat::conj
sycl::vec< T, 2 > conj(sycl::vec< T, 2 > x)
Computes the complex conjugate of a complex number.
Definition: math.hpp:581

syclcompat::min
std::enable_if_t< std::is_integral_v< ValueT > &&std::is_integral_v< ValueU >, std::common_type_t< ValueT, ValueU > > min(ValueT a, ValueU b)
Definition: math.hpp:429

syclcompat::relu
std::enable_if_t< std::is_floating_point_v< ValueT >||std::is_same_v< sycl::half, ValueT >, ValueT > relu(const ValueT a)
Performs relu saturation.
Definition: math.hpp:524

syclcompat::unordered_compare_both
std::enable_if_t< ValueT::size()==2, bool > unordered_compare_both(const ValueT a, const ValueT b, const BinaryOperation binary_op)
Performs 2 element unordered comparison and return true if both results are true.
Definition: math.hpp:257

syclcompat::cbrt
std::enable_if_t< std::is_floating_point_v< ValueT >||std::is_same_v< sycl::half, ValueT >, ValueT > cbrt(ValueT val)
cbrt function wrapper.
Definition: math.hpp:417

syclcompat::cdiv
sycl::vec< T, 2 > cdiv(sycl::vec< T, 2 > x, sycl::vec< T, 2 > y)
Computes the division of two complex numbers.
Definition: math.hpp:562

syclcompat::vectorized_min
T vectorized_min(T a, T b)
Compute vectorized min for two values, with each value treated as a vector type S.
Definition: math.hpp:317

syclcompat::fmin_nan
std::common_type_t< ValueT, ValueU > fmin_nan(const ValueT a, const ValueU b)
Performs 2 elements comparison and returns the smaller one.
Definition: math.hpp:485

syclcompat::cmul_add
sycl::vec< ValueT, 2 > cmul_add(const sycl::vec< ValueT, 2 > a, const sycl::vec< ValueT, 2 > b, const sycl::vec< ValueT, 2 > c)
Performs complex number multiply addition.
Definition: math.hpp:593

syclcompat::extend_sub_sat
constexpr RetT extend_sub_sat(AT a, BT b)
Extend a and b to 33 bits and subtract b from a with saturation.
Definition: math.hpp:793

syclcompat::clamp
ValueT clamp(ValueT val, ValueT min_val, ValueT max_val)
Returns min(max(val, min_val), max_val)
Definition: math.hpp:400

syclcompat::compare_mask
unsigned compare_mask(const sycl::vec< ValueT, 2 > a, const sycl::vec< ValueT, 2 > b, const BinaryOperation binary_op)
Performs 2 elements comparison, compare result of each element is 0 (false) or 0xffff (true),...
Definition: math.hpp:271

syclcompat::length
ValueT length(const ValueT *a, const int len)
Calculate the length of the input array, i.e. the square root of the sum of the squares of its elements.
Definition: math.hpp:161

syclcompat::unordered_compare_mask
unsigned unordered_compare_mask(const sycl::vec< ValueT, 2 > a, const sycl::vec< ValueT, 2 > b, const BinaryOperation binary_op)
Performs 2 elements unordered comparison, compare result of each element is 0 (false) or 0xffff (true...
Definition: math.hpp:287

syclcompat::compare_both
std::enable_if_t< ValueT::size()==2, bool > compare_both(const ValueT a, const ValueT b, const BinaryOperation binary_op)
Performs 2 element comparison and return true if both results are true.
Definition: math.hpp:245

syclcompat::vectorized_unary
unsigned vectorized_unary(unsigned a, const UnaryOperation unary_op)
Compute vectorized unary operation for a value, with the value treated as a vector type VecT.
Definition: math.hpp:333

syclcompat::vectorized_binary
unsigned vectorized_binary(unsigned a, unsigned b, const BinaryOperation binary_op)
Compute vectorized binary operation value for two values, with each value treated as a vector type Ve...
Definition: math.hpp:684

syclcompat::isnan
std::enable_if_t< ValueT::size()==2, ValueT > isnan(const ValueT a)
Determine whether 2 element value is NaN.
Definition: math.hpp:408

syclcompat::unordered_compare
std::enable_if_t< std::is_same_v< std::invoke_result_t< BinaryOperation, ValueT, ValueT >, bool >, bool > unordered_compare(const ValueT a, const ValueT b, const BinaryOperation binary_op)
Performs unordered comparison.
Definition: math.hpp:220

syclcompat::pow
std::enable_if_t<!std::is_floating_point_v< ValueT >, double > pow(const ValueT a, const ValueU b)
Definition: math.hpp:513

syclcompat::vectorized_sum_abs_diff
unsigned vectorized_sum_abs_diff(unsigned a, unsigned b)
Compute vectorized absolute difference for two values without modulo overflow, with each value treate...
Definition: math.hpp:348

syclcompat::vectorized_isgreater
T vectorized_isgreater(T a, T b)
Compute vectorized isgreater for two values, with each value treated as a vector type S.
Definition: math.hpp:367

syclcompat::cmul
sycl::vec< T, 2 > cmul(sycl::vec< T, 2 > x, sycl::vec< T, 2 > y)
Computes the multiplication of two complex numbers.
Definition: math.hpp:550

syclcompat::abs_diff
A sycl::abs_diff wrapper functors.
Definition: math.hpp:621

syclcompat::abs_diff::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:623

syclcompat::abs
A sycl::abs wrapper functors.
Definition: math.hpp:614

syclcompat::abs::operator()
auto operator()(const ValueT x) const
Definition: math.hpp:615

syclcompat::add_sat
A sycl::add_sat wrapper functors.
Definition: math.hpp:629

syclcompat::add_sat::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:631

syclcompat::hadd
A sycl::hadd wrapper functors.
Definition: math.hpp:645

syclcompat::hadd::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:647

syclcompat::maximum
A sycl::max wrapper functors.
Definition: math.hpp:653

syclcompat::maximum::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:655

syclcompat::minimum
A sycl::min wrapper functors.
Definition: math.hpp:661

syclcompat::minimum::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:663

syclcompat::rhadd
A sycl::rhadd wrapper functors.
Definition: math.hpp:637

syclcompat::rhadd::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:639

syclcompat::sub_sat
A sycl::sub_sat wrapper functors.
Definition: math.hpp:669

syclcompat::sub_sat::operator()
auto operator()(const ValueT x, const ValueT y) const
Definition: math.hpp:671

sycl.hpp