31 template <gpu_arch arch_tag_>
39 template <
typename tile_op_t_, gpu_arch arch_tag_>
51 template <
typename dequant_op_t_,
typename tile_op_t_,
typename quant_op_t_,
52 gpu_arch arch_tag_,
typename dtype_dequant_ =
float>
64 template <gpu_arch arch_tag_>
Definition limitation.hpp:607
gpu_arch
Definition common.hpp:73
Default epilogue policy for store C.
Definition epilogue_policy.hpp:32
static constexpr gpu_arch arch_tag
Definition epilogue_policy.hpp:33
Epilogue functor, specialized for quantization operator.
Definition epilogue_policy.hpp:53
quant_op_t_ quant_op_t
Definition epilogue_policy.hpp:56
dequant_op_t_ dequant_op_t
Definition epilogue_policy.hpp:54
static constexpr gpu_arch arch_tag
Definition epilogue_policy.hpp:57
dtype_dequant_ dtype_dequant
Definition epilogue_policy.hpp:58
tile_op_t_ tile_op_t
Definition epilogue_policy.hpp:55
Epilogue policy for tile_op + store C fusion.
Definition epilogue_policy.hpp:40
tile_op_t_ tile_op_t
Definition epilogue_policy.hpp:41
static constexpr gpu_arch arch_tag
Definition epilogue_policy.hpp:42
Epilogue policy for store unaligned C.
Definition epilogue_policy.hpp:65
static constexpr gpu_arch arch_tag
Definition epilogue_policy.hpp:66