XeTLA v0.3.6
Intel® Xe Templates for Linear Algebra - API Definition Document
 
Loading...
Searching...
No Matches
common.hpp File Reference

C++ API. More...

#include "common/common.hpp"
Include dependency graph for common.hpp:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Classes

struct  gpu::xetla::subgroup::detail::NextPowerOf2< N, K, true >
 
struct  gpu::xetla::subgroup::detail::NextPowerOf2< N, K, false >
 
struct  gpu::xetla::subgroup::detail::gcd< a, b >
 
struct  gpu::xetla::subgroup::detail::gcd< a, 0 >
 
struct  gpu::xetla::subgroup::is_same_layout< T_dst, T_src >
 
struct  gpu::xetla::subgroup::is_floating_to_integer< T_dst, T_src >
 
struct  gpu::xetla::subgroup::msg_type_query< tile_desc_, memory_space, memory_layout >
 
struct  gpu::xetla::subgroup::get_load_block_size_auto< dtype, tile_size_x, tile_size_y, arch_tag, mem_layout_, reg_layout_ >
 
struct  gpu::xetla::subgroup::get_load_block_size_auto< dtype, tile_size_x, tile_size_y, gpu_arch::Xe, mem_layout::row_major, reg_layout::tiled >
 
struct  gpu::xetla::subgroup::get_store_block_size_auto< dtype, tile_size_x, tile_size_y, arch_tag, mem_layout_, reg_layout_ >
 
struct  gpu::xetla::subgroup::get_store_block_size_auto< dtype, tile_size_x, tile_size_y, gpu_arch::Xe, mem_layout::row_major, reg_layout::tiled >
 
struct  gpu::xetla::subgroup::global_atomic_oob_check_on_tag
 
struct  gpu::xetla::subgroup::global_atomic_oob_check_off_tag
 

Namespaces

namespace  gpu
 
namespace  gpu::xetla
 
namespace  gpu::xetla::subgroup
 
namespace  gpu::xetla::subgroup::detail
 

Enumerations

enum class  gpu::xetla::subgroup::detail::process_flag : uint8_t { gpu::xetla::subgroup::detail::load = 0 , gpu::xetla::subgroup::detail::store = 1 }
 

Functions

template<uint32_t N>
constexpr uint32_t gpu::xetla::subgroup::detail::getNextPowerOf2 ()
 Get the next power of 2 for N.
 
template<>
constexpr uint32_t gpu::xetla::subgroup::detail::getNextPowerOf2< 0 > ()
 Specialization of getNextPowerOf2 for N = 0.
 
template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t >
__XETLA_API std::enable_if_t< base_len==0 > gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset)
 
template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t >
__XETLA_API std::enable_if_t< base_len !=0 &&payload_t::memory_space==mem_space::global > gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset)
 
template<uint32_t remained_len, uint32_t base_len, process_flag flag, cache_hint L1, cache_hint L2, typename payload_t , typename tile_t >
__XETLA_API std::enable_if_t< base_len !=0 &&payload_t::memory_space==mem_space::local > gpu::xetla::subgroup::detail::process_1d_tail (tile_t &tile, payload_t &payload, uint32_t offset)
 
template<uint32_t remained_len, uint32_t base_len, cache_hint L1, cache_hint L2, typename payload_t >
__XETLA_API std::enable_if_t<(base_len< 8)> gpu::xetla::subgroup::detail::process_1d_tail (payload_t &payload, uint32_t offset)
 

Variables

__XETLA_API uint32_t gpu::xetla::subgroup::detail::size_x
 
__XETLA_API uint32_t uint32_t gpu::xetla::subgroup::detail::size_y
 
__XETLA_API uint32_t uint32_t uint32_t gpu::xetla::subgroup::detail::scale_factor
 
__XETLA_API uint32_t uint32_t uint32_t uint8_t gpu::xetla::subgroup::detail::arr_len
 
template<typename tile_desc_ , mem_space memory_space>
constexpr msg_type gpu::xetla::subgroup::msg_type_v = msg_type_query<tile_desc_, memory_space>::value
 

Detailed Description

C++ API.