xetla/math__mma_8hpp_source.html

/*******************************************************************************

* Copyright (c) 2022-2023 Intel Corporation

*

* Licensed under the Apache License, Version 2.0 (the "License");

* you may not use this file except in compliance with the License.

* You may obtain a copy of the License at

*

*     http://www.apache.org/licenses/LICENSE-2.0

*

* Unless required by applicable law or agreed to in writing, software

* distributed under the License is distributed on an "AS IS" BASIS,

* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

* See the License for the specific language governing permissions and

* limitations under the License.

*******************************************************************************/


#pragma once


#include "common/core/common.hpp"


#pragma clang diagnostic push

#pragma clang diagnostic ignored "-Wunused-parameter"


namespace gpu::xetla {

namespace detail {


/// @brief Maps an element data type to the XeTLA dpas argument type.
///
/// This primary template is the fallback used for every @p dtype that has no
/// explicit specialization; it yields argument_type::U1.
/// NOTE(review): U1 doubles as the "no specialization" result here — confirm
/// that callers do not rely on it as an error sentinel.
///
/// @tparam dtype Element data type to translate.
/// @return argument_type::U1.
template <typename dtype>
constexpr gpu::xetla::argument_type mma_argument_type() {
    constexpr auto fallback_kind = gpu::xetla::argument_type::U1;
    return fallback_kind;
}


/// @brief Specialization for tf32 elements.
/// @return argument_type::TF32.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<tf32>() {
    constexpr auto tf32_kind = gpu::xetla::argument_type::TF32;
    return tf32_kind;
}


/// @brief Specialization for float elements.
///
/// float shares the TF32 argument type with the tf32 specialization.
/// @return argument_type::TF32.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<float>() {
    constexpr auto float_kind = gpu::xetla::argument_type::TF32;
    return float_kind;
}


/// @brief Specialization for int8_t elements.
/// @return argument_type::S8.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<int8_t>() {
    constexpr auto signed_byte_kind = gpu::xetla::argument_type::S8;
    return signed_byte_kind;
}


/// @brief Specialization for uint8_t elements.
/// @return argument_type::U8.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<uint8_t>() {
    constexpr auto unsigned_byte_kind = gpu::xetla::argument_type::U8;
    return unsigned_byte_kind;
}


/// @brief Specialization for bf16 elements.
/// @return argument_type::BF16.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<bf16>() {
    constexpr auto bf16_kind = gpu::xetla::argument_type::BF16;
    return bf16_kind;
}


/// @brief Specialization for fp16 elements.
/// @return argument_type::FP16.
template <>
constexpr gpu::xetla::argument_type mma_argument_type<fp16>() {
    constexpr auto fp16_kind = gpu::xetla::argument_type::FP16;
    return fp16_kind;
}


/// @brief Lookup table from a XeTLA argument_type enumerator to the
/// same-named ESIMD xmx dpas_argument_type enumerator.
///
/// The translation is resolved at compile time from the template argument.
/// Enumerators outside the supported list are rejected by the static_assert.
///
/// @tparam arg_type XeTLA-side argument type to translate.
/// @return The corresponding __ESIMD_NS::xmx::dpas_argument_type value.
template <gpu::xetla::argument_type arg_type>
constexpr __ESIMD_NS::xmx::dpas_argument_type get_argument_type() {
    using xetla_arg = gpu::xetla::argument_type;
    using dpas_arg = __ESIMD_NS::xmx::dpas_argument_type;

    static_assert(arg_type == xetla_arg::U1 || arg_type == xetla_arg::S1
                    || arg_type == xetla_arg::U2 || arg_type == xetla_arg::S2
                    || arg_type == xetla_arg::U4 || arg_type == xetla_arg::S4
                    || arg_type == xetla_arg::U8 || arg_type == xetla_arg::S8
                    || arg_type == xetla_arg::FP16
                    || arg_type == xetla_arg::BF16
                    || arg_type == xetla_arg::TF32,
            "Unsupported argument type");

    // An if-constexpr chain is used instead of a switch with an empty
    // default so that every control path ends in a return statement; the
    // previous form could flow off the end of this non-void function.
    if constexpr (arg_type == xetla_arg::U1) {
        return dpas_arg::u1;
    } else if constexpr (arg_type == xetla_arg::S1) {
        return dpas_arg::s1;
    } else if constexpr (arg_type == xetla_arg::U2) {
        return dpas_arg::u2;
    } else if constexpr (arg_type == xetla_arg::S2) {
        return dpas_arg::s2;
    } else if constexpr (arg_type == xetla_arg::U4) {
        return dpas_arg::u4;
    } else if constexpr (arg_type == xetla_arg::S4) {
        return dpas_arg::s4;
    } else if constexpr (arg_type == xetla_arg::U8) {
        return dpas_arg::u8;
    } else if constexpr (arg_type == xetla_arg::S8) {
        return dpas_arg::s8;
    } else if constexpr (arg_type == xetla_arg::BF16) {
        return dpas_arg::bf16;
    } else if constexpr (arg_type == xetla_arg::FP16) {
        return dpas_arg::fp16;
    } else {
        // The static_assert above leaves TF32 as the only remaining value.
        return dpas_arg::tf32;
    }
}


} // namespace detail


/// @brief Matrix multiply-add: thin wrapper that forwards to
/// __ESIMD_NS::xmx::dpas.
///
/// The element type T of @p src0 is passed to dpas as both of its first two
/// type arguments, and the returned vector has the same type and length as
/// @p src0.
/// NOTE(review): presumably src0 is the accumulator and src1/src2 are the
/// two multiplicands — confirm operand roles against the ESIMD dpas docs.
///
/// @tparam src1_precision XeTLA argument type describing @p src1.
/// @tparam src2_precision XeTLA argument type describing @p src2.
/// @tparam systolic_depth Forwarded unchanged as dpas' first template argument.
/// @tparam repeat_count   Forwarded unchanged as dpas' second template argument.
/// @tparam T   Element type of @p src0 and of the result.
/// @tparam T1  Element type of @p src1.
/// @tparam T2  Element type of @p src2.
/// @tparam N   Length of @p src0 and of the result.
/// @tparam N1  Length of @p src1.
/// @tparam N2  Length of @p src2.
/// @tparam Sat Saturation tag type (defaults to xetla_saturation_off_tag).
/// @param src0 First operand, forwarded to dpas.
/// @param src1 Second operand, forwarded to dpas.
/// @param src2 Third operand, forwarded to dpas.
/// @param sat  Saturation tag; accepted by this signature but not forwarded
///             to dpas in this implementation.
/// @return The vector produced by dpas.
template <argument_type src1_precision, argument_type src2_precision,
        int systolic_depth, int repeat_count, typename T, typename T1,
        typename T2, int N, int N1, int N2,
        typename Sat = xetla_saturation_off_tag>
__XETLA_API xetla_vector<T, N> xetla_mma(xetla_vector<T, N> src0,
        xetla_vector<T1, N1> src1, xetla_vector<T2, N2> src2, Sat sat = {}) {
    // Translate the XeTLA precision tags into their dpas counterparts once,
    // up front, so the dpas call below stays readable.
    constexpr auto src1_kind = detail::get_argument_type<src1_precision>();
    constexpr auto src2_kind = detail::get_argument_type<src2_precision>();

    return __ESIMD_NS::xmx::dpas<systolic_depth, repeat_count, T, T, T1, T2,
            src1_kind, src2_kind>(src0, src1, src2);
}


} // namespace gpu::xetla

#pragma clang diagnostic pop

common.hpp
C++ API.

__XETLA_API
#define __XETLA_API
Definition common.hpp:43

gpu::xetla::xetla_vector
__ESIMD_NS::simd< native_type_t< Ty >, N > xetla_vector
wrapper for xetla_vector.
Definition base_types.hpp:149

gpu::xetla::xetla_mma
__XETLA_API xetla_vector< T, N > xetla_mma(xetla_vector< T, N > src0, xetla_vector< T1, N1 > src1, xetla_vector< T2, N2 > src2, Sat sat={})
Performs the XeTLA matrix multiply-add (mma) operation.
Definition math_mma.hpp:144

gpu::xetla::detail::mma_argument_type< uint8_t >
constexpr gpu::xetla::argument_type mma_argument_type< uint8_t >()
Definition math_mma.hpp:55

gpu::xetla::detail::mma_argument_type< int8_t >
constexpr gpu::xetla::argument_type mma_argument_type< int8_t >()
Definition math_mma.hpp:50

gpu::xetla::detail::mma_argument_type< tf32 >
constexpr gpu::xetla::argument_type mma_argument_type< tf32 >()
Definition math_mma.hpp:40

gpu::xetla::detail::mma_argument_type< fp16 >
constexpr gpu::xetla::argument_type mma_argument_type< fp16 >()
Definition math_mma.hpp:65

gpu::xetla::detail::mma_argument_type< float >
constexpr gpu::xetla::argument_type mma_argument_type< float >()
Definition math_mma.hpp:45

gpu::xetla::detail::mma_argument_type
constexpr gpu::xetla::argument_type mma_argument_type()
convert normal data type to dpas argument type
Definition math_mma.hpp:35

gpu::xetla::detail::mma_argument_type< bf16 >
constexpr gpu::xetla::argument_type mma_argument_type< bf16 >()
Definition math_mma.hpp:60

gpu::xetla::detail::get_argument_type
constexpr __ESIMD_NS::xmx::dpas_argument_type get_argument_type()
lookup table for dpas argument type
Definition math_mma.hpp:73

gpu::xetla
Definition arch_config.hpp:24

gpu::xetla::argument_type
argument_type
xetla dpas argument type
Definition common.hpp:184

gpu::xetla::argument_type::U2
@ U2

gpu::xetla::argument_type::U8
@ U8

gpu::xetla::argument_type::S1
@ S1

gpu::xetla::argument_type::U4
@ U4

gpu::xetla::argument_type::TF32
@ TF32

gpu::xetla::argument_type::FP16
@ FP16

gpu::xetla::argument_type::S8
@ S8

gpu::xetla::argument_type::S2
@ S2

gpu::xetla::argument_type::S4
@ S4

gpu::xetla::argument_type::BF16
@ BF16

gpu::xetla::argument_type::U1
@ U1