|
template<typename RetType , typename Func , typename Arg > |
static Arg | cl::sycl::detail::member_ptr_helper (RetType(Func::*)(Arg) const) |
|
template<typename F , typename SuggestedArgType > |
SuggestedArgType | cl::sycl::detail::argument_helper (...) |
|
device | cl::sycl::detail::getDeviceFromHandler (handler &CommandGroupHandlerRef) |
|
template<int Dims, typename T > |
detail::enable_if_t< std::is_same< T, range< Dims > >::value||std::is_same< T, id< Dims > >::value > | cl::sycl::detail::checkValueRange (const T &V) |
|
template<int Dims> |
void | cl::sycl::detail::checkValueRange (const range< Dims > &R, const id< Dims > &O) |
|
template<int Dims, typename T > |
detail::enable_if_t< std::is_same< T, nd_range< Dims > >::value > | cl::sycl::detail::checkValueRange (const T &V) |
|
template<typename KernelName , typename KernelType , int Dims, class Reduction > |
void | cl::sycl::ext::oneapi::detail::reduCGFunc (handler &CGH, KernelType KernelFunc, const range< Dims > &Range, size_t MaxWGSize, uint32_t NumConcurrentWorkGroups, Reduction &Redu) |
|
template<typename KernelName , typename KernelType , int Dims, class Reduction > |
enable_if_t< Reduction::has_atomic_add_float64 > | cl::sycl::ext::oneapi::detail::reduCGFuncAtomic64 (handler &CGH, KernelType KernelFunc, const nd_range< Dims > &Range, Reduction &Redu) |
|
template<typename KernelName , typename KernelType , int Dims, class Reduction > |
enable_if_t< Reduction::has_fast_atomics > | cl::sycl::ext::oneapi::detail::reduCGFunc (handler &CGH, KernelType KernelFunc, const nd_range< Dims > &Range, Reduction &Redu) |
|
template<typename KernelName , typename KernelType , int Dims, class Reduction > |
enable_if_t<!Reduction::has_fast_atomics > | cl::sycl::ext::oneapi::detail::reduCGFunc (handler &CGH, KernelType KernelFunc, const nd_range< Dims > &Range, Reduction &Redu) |
|
template<typename KernelName , typename KernelType , class Reduction > |
enable_if_t<!Reduction::has_fast_atomics, size_t > | cl::sycl::ext::oneapi::detail::reduAuxCGFunc (handler &CGH, size_t NWorkItems, size_t MaxWGSize, Reduction &Redu) |
| Implements a command group function that enqueues a kernel performing one iteration of reduction over the elements in each work-group. More...
|
|
template<typename KernelName , typename KernelType , int Dims, typename... Reductions, size_t... Is> |
void | cl::sycl::ext::oneapi::detail::reduCGFunc (handler &CGH, KernelType KernelFunc, const nd_range< Dims > &Range, std::tuple< Reductions... > &ReduTuple, std::index_sequence< Is... >) |
|
template<typename KernelName , typename KernelType , typename... Reductions, size_t... Is> |
size_t | cl::sycl::ext::oneapi::detail::reduAuxCGFunc (handler &CGH, size_t NWorkItems, size_t MaxWGSize, std::tuple< Reductions... > &ReduTuple, std::index_sequence< Is... >) |
|
template<typename KernelName , class Reduction > |
std::enable_if_t<!Reduction::is_usm > | cl::sycl::ext::oneapi::detail::reduSaveFinalResultToUserMem (handler &CGH, Reduction &Redu) |
| Copies the final reduction result kept in a read-write accessor to the user's accessor. More...
|
|
template<typename KernelName , class Reduction > |
std::enable_if_t< Reduction::is_usm > | cl::sycl::ext::oneapi::detail::reduSaveFinalResultToUserMem (handler &CGH, Reduction &Redu) |
| Copies the final reduction result kept in a read-write accessor to the user's USM memory. More...
|
|
template<typename... Reduction, size_t... Is> |
std::shared_ptr< event > | cl::sycl::ext::oneapi::detail::reduSaveFinalResultToUserMem (std::shared_ptr< detail::queue_impl > Queue, bool IsHost, std::tuple< Reduction... > &ReduTuple, std::index_sequence< Is... >) |
| Creates additional kernels that copy the accumulated/final results from the reductions' accessors to either the user's accessor or the user's USM memory. More...
|
|
template<typename Reduction , typename... RestT> |
std::enable_if_t<!Reduction::is_usm > | cl::sycl::ext::oneapi::detail::reduSaveFinalResultToUserMemHelper (std::vector< event > &Events, std::shared_ptr< detail::queue_impl > Queue, bool IsHost, Reduction &Redu, RestT... Rest) |
|
uint32_t | cl::sycl::ext::oneapi::detail::reduGetMaxNumConcurrentWorkGroups (std::shared_ptr< queue_impl > Queue) |
|
size_t | cl::sycl::ext::oneapi::detail::reduGetMaxWGSize (std::shared_ptr< queue_impl > Queue, size_t LocalMemBytesPerWorkItem) |
|
template<typename... ReductionT, size_t... Is> |
size_t | cl::sycl::ext::oneapi::detail::reduGetMemPerWorkItem (std::tuple< ReductionT... > &ReduTuple, std::index_sequence< Is... >) |
|
template<typename TupleT , std::size_t... Is> |
std::tuple< std::tuple_element_t< Is, TupleT >... > | cl::sycl::ext::oneapi::detail::tuple_select_elements (TupleT Tuple, std::index_sequence< Is... >) |
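| Utility function: for the given tuple, returns a new tuple consisting only of the elements whose indices appear in the given index sequence. More...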
|
|