XeTLA v0.3.6
Intel® Xe Templates for Linear Algebra - API Definition Document
 
Loading...
Searching...
No Matches
misc.hpp File Reference

C++ API. More...

Include dependency graph for misc.hpp:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Namespaces

namespace  gpu
 
namespace  gpu::xetla
 

Functions

__XETLA_API constexpr uint32_t div_round_up (uint32_t n, uint32_t d)
 
__XETLA_API constexpr int div_round_down (int n, int d)
 
__XETLA_API constexpr int modulo (int n, int d)
 
__XETLA_API constexpr uint32_t cacheline_align_up (size_t size)
 
__XETLA_API xetla_vector< uint32_t, 4 > gpu::xetla::get_time_stamp ()
 Returns time stamp.
 
template<typename Ty , int N>
__XETLA_API xetla_vector< Ty, N > gpu::xetla::xetla_vector_gen (int InitVal, int Step)
 xetla_vector generation.
 
template<uint32_t N>
__XETLA_API xetla_mask_int< N > gpu::xetla::xetla_mask_int_gen (uint32_t mask_val)
 
template<typename dtype_acc , uint32_t N, uint32_t num_flag = 4, typename dtype_mask = uint8_t>
__XETLA_API xetla_vector< dtype_acc, N > gpu::xetla::drop_out (xetla_vector< dtype_acc, N > in, xetla_vector< dtype_mask, N > mask, dtype_acc scale)
 
template<reduce_op reduce_kind, typename dtype , int size>
__XETLA_API std::enable_if_t< reduce_kind==reduce_op::sum, xetla_vector< dtype, size > > gpu::xetla::reduce_helper (xetla_vector< dtype, size > a, xetla_vector< dtype, size > b)
 
template<reduce_op reduce_kind, typename dtype , int size>
__XETLA_API std::enable_if_t< reduce_kind==reduce_op::prod, xetla_vector< dtype, size > > gpu::xetla::reduce_helper (xetla_vector< dtype, size > a, xetla_vector< dtype, size > b)
 
template<reduce_op reduce_kind, typename dtype , int size>
__XETLA_API std::enable_if_t< reduce_kind==reduce_op::max, xetla_vector< dtype, size > > gpu::xetla::reduce_helper (xetla_vector< dtype, size > a, xetla_vector< dtype, size > b)
 
template<reduce_op reduce_kind, typename dtype , int size>
__XETLA_API std::enable_if_t< reduce_kind==reduce_op::min, xetla_vector< dtype, size > > gpu::xetla::reduce_helper (xetla_vector< dtype, size > a, xetla_vector< dtype, size > b)
 
template<reduce_op reduce_kind, typename dtype , int N_x, int N_y>
__XETLA_API std::enable_if_t< N_y==1, xetla_vector< dtype, N_x > > gpu::xetla::recur_row_reduce (xetla_vector< dtype, N_x > in)
 
template<reduce_op reduce_kind, typename dtype , int N_x, int N_y>
__XETLA_API std::enable_if_t<(N_y > 1), xetla_vector< dtype, N_x > > gpu::xetla::recur_row_reduce (xetla_vector< dtype, N_x *N_y > in)
 
template<reduce_op reduce_kind, typename dtype , int N_x, int N_y>
__XETLA_API std::enable_if_t< N_x==1, xetla_vector< dtype, N_y > > gpu::xetla::recur_col_reduce (xetla_vector< dtype, N_y > in)
 
template<reduce_op reduce_kind, typename dtype , int N_x, int N_y>
__XETLA_API std::enable_if_t<(N_x > 1), xetla_vector< dtype, N_y > > gpu::xetla::recur_col_reduce (xetla_vector< dtype, N_x *N_y > in)
 
__XETLA_API uint32_t gpu::xetla::get_2d_group_linear_id (sycl::nd_item< 3 > &item)
 Gets the linear group id of the last two dimensions.
 

Detailed Description

C++ API.

Function Documentation

◆ cacheline_align_up()

__XETLA_API constexpr uint32_t cacheline_align_up ( size_t  size)
constexpr

◆ div_round_down()

__XETLA_API constexpr int div_round_down ( int  n,
int  d 
)
constexpr

◆ div_round_up()

__XETLA_API constexpr uint32_t div_round_up ( uint32_t  n,
uint32_t  d 
)
constexpr

◆ modulo()

__XETLA_API constexpr int modulo ( int  n,
int  d 
)
constexpr