XeTLA
v0.3.6
Intel® Xe Templates for Linear Algebra - API Definition Document
Loading...
Searching...
No Matches
row_reduction_fused_op_api.hpp
Go to the documentation of this file.
1
/*******************************************************************************
2
* Copyright (c) 2022-2023 Intel Corporation
3
*
4
* Licensed under the Apache License, Version 2.0 (the "License");
5
* you may not use this file except in compliance with the License.
6
* You may obtain a copy of the License at
7
*
8
* http://www.apache.org/licenses/LICENSE-2.0
9
*
10
* Unless required by applicable law or agreed to in writing, software
11
* distributed under the License is distributed on an "AS IS" BASIS,
12
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
* See the License for the specific language governing permissions and
14
* limitations under the License.
15
*******************************************************************************/
16
19
20
#pragma once
21
22
#include "subgroup/subgroup.hpp"
23
24
namespace
gpu::xetla
{
25
28
/// @brief Tag selecting which additional op is fused into the row reduction.
///
/// Used as the first (non-type) template argument of
/// group::row_reduction_fused_op_t. Stored in a single byte (underlying type
/// uint8_t); the numeric values are fixed explicitly and must stay stable.
///
/// NOTE(review): the enumerator semantics below are inferred from the names
/// only -- the implementing specializations are not visible in this file.
enum class reduction_fused_kind : uint8_t {
    /// No additional op is fused.
    none = 0,
    /// Presumably the bias + GeLU backward fusion -- TODO confirm.
    bias_gelu_w_bwd = 1,
    /// Presumably the bias + dropout backward fusion -- TODO confirm.
    bias_dropout_bwd = 2
};
33
34
namespace
group {
35
44
template
<
reduction_fused_kind
fused_op_kind_,
typename
dtype_in_,
45
typename
dtype_out_,
typename
dtype_acc_,
typename
reduction_attr_,
46
gpu_arch
arch_ =
gpu_arch::Xe
>
47
struct
row_reduction_fused_op_t
{};
48
49
}
// namespace group
50
}
// namespace gpu::xetla
gpu::xetla
Definition
arch_config.hpp:24
gpu::xetla::cache_hint::none
@ none
gpu::xetla::gpu_arch
gpu_arch
Definition
common.hpp:73
gpu::xetla::gpu_arch::Xe
@ Xe
gpu::xetla::reduction_fused_kind
reduction_fused_kind
Definition
row_reduction_fused_op_api.hpp:28
gpu::xetla::reduction_fused_kind::bias_gelu_w_bwd
@ bias_gelu_w_bwd
gpu::xetla::reduction_fused_kind::bias_dropout_bwd
@ bias_dropout_bwd
gpu::xetla::group::row_reduction_fused_op_t
Additional Ops that can be fused with row reduction processing flow.
Definition
row_reduction_fused_op_api.hpp:47
include
experimental
group
fused_op
row_reduction_fused_op_api.hpp
Generated by
1.9.7