|
static _tile1024i | tileloadd64_internal (short row, short col, char *buf, size_t stride) |
|
static _tile1024i | tdpbssd_internal (unsigned short m, unsigned short n, unsigned short k, _tile1024i dst, _tile1024i src1, _tile1024i src2) |
|
static _tile1024i | tdpbf16ps_internal (unsigned short m, unsigned short n, unsigned short k, _tile1024i dst, _tile1024i src1, _tile1024i src2) |
|
static void | tilestored64_internal (short row, short col, char *buf, size_t stride, _tile1024i tile) |
|
template<typename Group , typename T , size_t NumRows, size_t NumCols, matrix_layout Layout, access::address_space Space> |
__SYCL_ALWAYS_INLINE std::enable_if<(NumRows > tile_size)||(NumCols *sizeof(T)/4 > tile_size), void >::type | joint_matrix_load (Group sg, joint_matrix< Group, T, NumRows, NumCols, Layout > &jm, multi_ptr< T, Space > src, size_t stride, matrix_layout layout) |
|
template<typename Group , typename T , size_t NumRows, size_t NumCols, matrix_layout Layout, access::address_space Space> |
__SYCL_ALWAYS_INLINE std::enable_if<(NumRows<=tile_size) &&(NumCols *sizeof(T)/4<=tile_size), void >::type | joint_matrix_load (Group sg, joint_matrix< Group, T, NumRows, NumCols, Layout > &jm, multi_ptr< T, Space > src, size_t stride, matrix_layout layout) |
|
template<typename Group , typename T , size_t NumRows, size_t NumCols, matrix_layout Layout, access::address_space Space> |
__SYCL_ALWAYS_INLINE std::enable_if<(NumRows > tile_size)||(NumCols *sizeof(T)/4 > tile_size), void >::type | joint_matrix_store (Group sg, joint_matrix< Group, T, NumRows, NumCols, Layout > &jm, multi_ptr< T, Space > dst, size_t stride, matrix_layout layout) |
|
template<typename Group , typename T , size_t NumRows, size_t NumCols, matrix_layout Layout, access::address_space Space> |
__SYCL_ALWAYS_INLINE std::enable_if<(NumRows<=tile_size) &&(NumCols *sizeof(T)/4<=tile_size), void >::type | joint_matrix_store (Group sg, joint_matrix< Group, T, NumRows, NumCols, Layout > &jm, multi_ptr< T, Space > dst, size_t stride, matrix_layout layout) |
|
template<typename Group , typename T1 , typename T2 , size_t NumRowsA, size_t NumColsA, size_t NumRowsB, size_t NumColsB, size_t NumRowsC, size_t NumColsC, matrix_layout LayoutA, matrix_layout LayoutB, matrix_layout LayoutC> |
__SYCL_ALWAYS_INLINE std::enable_if<((std::is_same< T1, int8_t >::value &&std::is_same< T2, int32_t >::value)||(std::is_same< T1, unsigned short >::value &&std::is_same< T2, float >::value)) &&(LayoutA==matrix_layout::row_major) &&(LayoutB==matrix_layout::packed_b) &&(LayoutC==matrix_layout::row_major), joint_matrix< Group, T2, NumRowsC, NumColsC, LayoutC > >::type | joint_matrix_mad (Group sg, joint_matrix< Group, T1, NumRowsA, NumColsA, LayoutA > &jmA, joint_matrix< Group, T1, NumRowsB, NumColsB, LayoutB > &jmB, joint_matrix< Group, T2, NumRowsC, NumColsC, LayoutC > &jmC) |
|