35template <uint32_t wg_tile_n_, uint32_t wg_tile_m_, uint32_t sg_tile_n_,
36 uint32_t sg_tile_m_ = 1, uint32_t wg_num_m_ = 1, uint32_t wg_num_n_ = 1,
37 uint32_t chunk_size_ = 1>
43 static constexpr uint32_t
wg_num_m = wg_num_m_;
44 static constexpr uint32_t
wg_num_n = wg_num_n_;
48 "Currently, we don't see the value to set sg_tile_m > 1. Maybe it "
49 "can be used to save the L1 BW when load gamma/beta");
51 "Current design doesn't support cross workgroup sync. So, wg_num_n "
52 "should be 1, i.e. one entire row should be processed inside the "
55 "Current design we don't enable the boundary check");
57 "Current design we don't enable the boundary check on chunking "
Definition limitation.hpp:734
Sets up attribute of the layer norm.
Definition config.hpp:38
static constexpr uint32_t wg_num_n
Definition config.hpp:44
static constexpr uint32_t wg_tile_n
Definition config.hpp:40
static constexpr uint32_t sg_tile_m
Definition config.hpp:41
static constexpr uint32_t chunk_size
Definition config.hpp:45
static constexpr uint32_t wg_num_m
Definition config.hpp:43
static constexpr uint32_t sg_tile_n
Definition config.hpp:42
static constexpr uint32_t wg_tile_m
Definition config.hpp:39