|
| template<uint32_t N> |
| constexpr uint32_t | gpu::xetla::subgroup::detail::getNextPowerOf2 () |
| | Get the next power of 2 for the template parameter N, evaluated at compile time.
|
| |
| template<> |
| constexpr uint32_t | gpu::xetla::subgroup::detail::getNextPowerOf2< 0 > () |
| | Explicit specialization of getNextPowerOf2 for N = 0.
|
| |
| template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t > |
| __XETLA_API std::enable_if_t< base_len==0 > | gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset) |
| |
| template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t > |
| __XETLA_API std::enable_if_t< base_len != 0 && payload_t::memory_space == mem_space::global > | gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset) |
| |
| template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t > |
| __XETLA_API std::enable_if_t< base_len != 0 && payload_t::memory_space == mem_space::local > | gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset) |
| |
| template<uint32_t remained_len, uint32_t base_len, cache_hint L1, cache_hint L2, typename payload_t > |
| __XETLA_API std::enable_if_t<(base_len < 8)> | gpu::xetla::subgroup::detail::process_1d_tail (payload_t &payload, uint32_t offset) |
| |