|
| __XETLA_API xetla_vector< uint32_t, 4 > | gpu::xetla::get_time_stamp () |
| | Returns time stamp.
|
| |
| template<typename Ty , int N> |
| __XETLA_API xetla_vector< Ty, N > | gpu::xetla::xetla_vector_gen (int InitVal, int Step) |
| | xetla_vector generation.
|
| |
| template<uint32_t N> |
| __XETLA_API xetla_mask_int< N > | gpu::xetla::xetla_mask_int_gen (uint32_t mask_val) |
| |
| template<typename dtype_acc , uint32_t N, uint32_t num_flag = 4, typename dtype_mask = uint8_t> |
| __XETLA_API xetla_vector< dtype_acc, N > | gpu::xetla::drop_out (xetla_vector< dtype_acc, N > in, xetla_vector< dtype_mask, N > mask, dtype_acc scale) |
| |
| template<reduce_op reduce_kind, typename dtype , int size> |
| __XETLA_API std::enable_if_t< reduce_kind==reduce_op::sum, xetla_vector< dtype, size > > | gpu::xetla::reduce_helper (xetla_vector< dtype, size > a, xetla_vector< dtype, size > b) |
| |
| template<reduce_op reduce_kind, typename dtype , int N_x, int N_y> |
| __XETLA_API std::enable_if_t< N_y==1, xetla_vector< dtype, N_x > > | gpu::xetla::recur_row_reduce (xetla_vector< dtype, N_x > in) |
| |
| template<reduce_op reduce_kind, typename dtype , int N_x, int N_y> |
| __XETLA_API std::enable_if_t<(N_y > 1), xetla_vector< dtype, N_x > > | gpu::xetla::recur_row_reduce (xetla_vector< dtype, N_x *N_y > in) |
| |
| template<reduce_op reduce_kind, typename dtype , int N_x, int N_y> |
| __XETLA_API std::enable_if_t< N_x==1, xetla_vector< dtype, N_y > > | gpu::xetla::recur_col_reduce (xetla_vector< dtype, N_y > in) |
| |
| template<reduce_op reduce_kind, typename dtype , int N_x, int N_y> |
| __XETLA_API std::enable_if_t<(N_x > 1), xetla_vector< dtype, N_y > > | gpu::xetla::recur_col_reduce (xetla_vector< dtype, N_x *N_y > in) |
| |
| __XETLA_API uint32_t | gpu::xetla::get_2d_group_linear_id (sycl::nd_item< 3 > &item) |
| | get linear group id of the last two dimensions.
|
| |
Implements some useful and commonly used APIs, such as vector generation API.