|
| template<typename dtype > |
| constexpr gpu::xetla::argument_type | mma_argument_type () |
| | Convert a normal data type to the corresponding DPAS argument type (gpu::xetla::argument_type).
|
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< tf32 > () |
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< float > () |
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< int8_t > () |
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< uint8_t > () |
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< bf16 > () |
| |
| template<> |
| constexpr gpu::xetla::argument_type | mma_argument_type< fp16 > () |
| |
| template<gpu::xetla::argument_type arg_type> |
| constexpr __ESIMD_NS::xmx::dpas_argument_type | get_argument_type () |
| | Lookup table mapping a gpu::xetla::argument_type to the corresponding __ESIMD_NS::xmx::dpas_argument_type.
|
| |
| constexpr __ESIMD_ENS::cache_hint | get_cache_hint (gpu::xetla::cache_hint ch) |
| | Lookup table mapping a gpu::xetla::cache_hint to the corresponding __ESIMD_ENS::cache_hint.
|
| |
| constexpr __ESIMD_ENS::lsc_data_size | get_data_size (gpu::xetla::data_size ds) |
| | Lookup table mapping a gpu::xetla::data_size to the corresponding __ESIMD_ENS::lsc_data_size.
|
| |
| constexpr __ESIMD_ENS::lsc_memory_kind | get_memory_kind (gpu::xetla::memory_kind mk) |
| | Lookup table mapping a gpu::xetla::memory_kind to the corresponding __ESIMD_ENS::lsc_memory_kind.
|
| |
| constexpr __ESIMD_ENS::lsc_fence_op | get_fence_op (gpu::xetla::fence_op fo) |
| | Lookup table mapping a gpu::xetla::fence_op to the corresponding __ESIMD_ENS::lsc_fence_op.
|
| |
| constexpr __ESIMD_ENS::lsc_scope | get_fence_scope (gpu::xetla::fence_scope fs) |
| | Lookup table mapping a gpu::xetla::fence_scope to the corresponding __ESIMD_ENS::lsc_scope.
|
| |
| constexpr __ESIMD_NS::atomic_op | get_atomic_op (gpu::xetla::atomic_op ao) |
| | Lookup table mapping a gpu::xetla::atomic_op to the corresponding __ESIMD_NS::atomic_op.
|
| |
| template<uint32_t element_size> |
| constexpr uint32_t | get_element_size_code () |
| | Get the element size code (a uint32_t) for the given element_size template argument.
|
| |
| template<lsc_action Action, cache_hint L1H, cache_hint L2H, gpu_arch arch_tag> |
| constexpr std::enable_if_t< arch_tag==gpu_arch::Xe, void > | check_lsc_cache_hint () |
| |
| template<cache_hint L1H, cache_hint L2H, gpu_arch arch_tag> |
| constexpr std::enable_if_t< arch_tag==gpu_arch::Xe, uint32_t > | get_load_cache_hint_code () |
| |
| template<cache_hint L1H, cache_hint L2H, gpu_arch arch_tag> |
| constexpr std::enable_if_t< arch_tag==gpu_arch::Xe, uint32_t > | get_prefetch_cache_hint_code () |
| |
| template<cache_hint L1H, cache_hint L2H, gpu_arch arch_tag> |
| constexpr std::enable_if_t< arch_tag==gpu_arch::Xe, uint32_t > | get_store_cache_hint_code () |
| |
| template<cache_hint L1H, cache_hint L2H, gpu_arch arch_tag> |
| constexpr std::enable_if_t< arch_tag==gpu_arch::Xe, uint32_t > | get_atomic_cache_hint_code () |
| |
| template<uint32_t num_channel> |
| constexpr uint32_t | get_execSize_code () |
| |
| template<atomic_op Op> |
| constexpr uint32_t | get_atomic_opcode () |
| |
| __XETLA_API void | xetla_set_tensor_base_address (xetla_tdescriptor_ref desc, uint64_t base_address) |
| |
| __XETLA_API void | xetla_set_tensor_base_address (xetla_tdescriptor_ref desc, uint32_t base_address) |
| |
| __XETLA_API uint64_t | xetla_get_tensor_base_address (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_tensor_width_x (xetla_tdescriptor_ref desc, uint32_t width_x) |
| |
| __XETLA_API uint32_t | xetla_get_tensor_width_x (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_tensor_width_y (xetla_tdescriptor_ref desc, uint32_t width_y) |
| |
| __XETLA_API uint32_t | xetla_get_tensor_width_y (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_tensor_pitch_x (xetla_tdescriptor_ref desc, uint32_t pitch_x) |
| |
| __XETLA_API uint32_t | xetla_get_tensor_pitch_x (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_tensor_offset_x (xetla_tdescriptor_ref desc, int32_t offset_x) |
| |
| __XETLA_API int32_t | xetla_get_tensor_offset_x (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_tensor_offset_y (xetla_tdescriptor_ref desc, int32_t offset_y) |
| |
| __XETLA_API int32_t | xetla_get_tensor_offset_y (xetla_tdescriptor desc) |
| |
| __XETLA_API void | xetla_set_block_widthx_widthy_arrlen (xetla_tdescriptor_ref desc, uint32_t block_widthx_widthy_arrlen) |
| |
| __XETLA_API uint8_t | xetla_get_block_width_x (xetla_tdescriptor desc) |
| |
| __XETLA_API uint8_t | xetla_get_block_width_y (xetla_tdescriptor desc) |
| |
| __XETLA_API uint8_t | xetla_get_block_array_len (xetla_tdescriptor desc) |
| |