XeTLA
v0.3.6
Intel® Xe Templates for Linear Algebra - API Definition Document
Loading...
Searching...
No Matches
reduction_api.hpp
Go to the documentation of this file.
1
/*******************************************************************************
2
* Copyright (c) 2022-2023 Intel Corporation
3
*
4
* Licensed under the Apache License, Version 2.0 (the "License");
5
* you may not use this file except in compliance with the License.
6
* You may obtain a copy of the License at
7
*
8
* http://www.apache.org/licenses/LICENSE-2.0
9
*
10
* Unless required by applicable law or agreed to in writing, software
11
* distributed under the License is distributed on an "AS IS" BASIS,
12
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
* See the License for the specific language governing permissions and
14
* limitations under the License.
15
*******************************************************************************/
16
19
20
#pragma once
21
22
#include "subgroup/subgroup.hpp"
23
24
namespace
gpu::xetla::group
{
25
36
template
<
typename
dtype_acc,
typename
dtype_out, uint32_t row_size,
37
uint32_t wg_size_x, uint32_t wg_size_y, uint32_t max_simd_len = 32,
38
gpu_arch
arch_ =
gpu_arch::Xe
>
39
struct
group_row_reduce_store_t
{};
40
41
}
// namespace gpu::xetla::group
gpu::xetla::group
Definition
limitation.hpp:607
gpu::xetla::gpu_arch
gpu_arch
Definition
common.hpp:73
gpu::xetla::gpu_arch::Xe
@ Xe
gpu::xetla::group::group_row_reduce_store_t
This is the group row reduction(reduce_sum) + cooperative write out.
Definition
reduction_api.hpp:39
include
experimental
group
reduction
reduction_api.hpp
Generated by
1.9.7