PI queue mapping onto CUstream objects. More...
#include <cuda/pi_cuda.hpp>
Classes | |
struct | CommandBatch |
struct | pi_queue_group_t |
Public Types | |
using | native_type = CUstream |
using | native_type = hipStream_t |
using | queue_type = _pi_device::queue_group_info_t::type |
typedef struct _pi_queue::CommandBatch | command_batch |
Static Public Attributes | |
static constexpr int | default_num_compute_streams = 128 |
static constexpr int | default_num_transfer_streams = 64 |
PI queue mapping onto CUstream objects.
PI queue mapping onto hipStream_t objects.
Definition at line 392 of file pi_cuda.hpp.
typedef struct _pi_queue::CommandBatch _pi_queue::command_batch |
using _pi_queue::native_type = hipStream_t |
Definition at line 372 of file pi_hip.hpp.
using _pi_queue::native_type = CUstream |
Definition at line 393 of file pi_cuda.hpp.
Definition at line 806 of file pi_level_zero.hpp.
|
inline |
Definition at line 424 of file pi_cuda.hpp.
Referenced by piextQueueCreateWithNativeHandle(), and piQueueCreate().
|
inline |
Definition at line 440 of file pi_cuda.hpp.
References context_, cuda_piContextRelease(), cuda_piDeviceRelease(), and device_.
|
inline |
Definition at line 109 of file pi_esimd_emulator.hpp.
|
inline |
Definition at line 381 of file pi_hip.hpp.
|
inline |
Definition at line 389 of file pi_hip.hpp.
References context_, device_, hip_piContextRelease(), and hip_piDeviceRelease().
_pi_queue::_pi_queue(std::vector< ze_command_queue_handle_t > & ComputeQueues, std::vector< ze_command_queue_handle_t > & CopyQueues, pi_context Context, pi_device Device, bool OwnZeCommandQueue, pi_queue_properties Properties = 0)
Definition at line 1055 of file pi_level_zero.cpp.
References Context.
void _pi_queue::adjustBatchSizeForFullBatch(bool IsCopy)
Definition at line 1316 of file pi_level_zero.cpp.
References ComputeCommandBatch, CopyCommandBatch, CommandListBatchConfig::dynamic(), CommandListBatchConfig::DynamicSizeMax, CommandListBatchConfig::DynamicSizeStep, _pi_queue::CommandBatch::NumTimesClosedEarly, CommandListBatchConfig::NumTimesClosedEarlyThreshold, _pi_queue::CommandBatch::NumTimesClosedFull, CommandListBatchConfig::NumTimesClosedFullThreshold, _pi_queue::CommandBatch::QueueBatchSize, ZeCommandListBatchComputeConfig, ZeCommandListBatchConfig(), and ZeCommandListBatchCopyConfig.
Referenced by executeCommandList().
void _pi_queue::adjustBatchSizeForPartialBatch(bool IsCopy)
Definition at line 1343 of file pi_level_zero.cpp.
References ComputeCommandBatch, CopyCommandBatch, CommandListBatchConfig::dynamic(), _pi_queue::CommandBatch::NumTimesClosedEarly, _pi_queue::CommandBatch::NumTimesClosedFull, _pi_queue::CommandBatch::OpenCommandList, _pi_queue::CommandBatch::QueueBatchSize, ZeCommandListBatchComputeConfig, ZeCommandListBatchConfig(), and ZeCommandListBatchCopyConfig.
Referenced by executeOpenCommandList().
|
inline noexcept |
Definition at line 583 of file pi_cuda.hpp.
References has_ownership_.
Referenced by cuda_piQueueRelease().
|
inline |
Definition at line 466 of file pi_cuda.hpp.
References compute_stream_idx_, compute_streams_, has_been_synchronized(), and max().
Referenced by get_next_compute_stream().
void _pi_queue::CaptureIndirectAccesses()
Definition at line 1369 of file pi_level_zero.cpp.
References _pi_platform::Contexts, Device, KernelsToBeSubmitted, and _pi_device::Platform.
Referenced by executeCommandList(), and piEnqueueKernelLaunch().
|
inline noexcept |
Definition at line 400 of file pi_hip.hpp.
References refCount_.
|
inline noexcept |
Definition at line 577 of file pi_cuda.hpp.
References refCount_.
Referenced by cuda_piQueueRelease(), and hip_piQueueRelease().
pi_command_list_ptr_t _pi_queue::eventOpenCommandList(pi_event Event)
Definition at line 1675 of file pi_level_zero.cpp.
References CommandListMap, ComputeCommandBatch, CopyCommandBatch, hasOpenCommandList(), and _pi_queue::CommandBatch::OpenCommandList.
Referenced by _pi_ze_event_list_t::createAndRetainPiZeEventList().
|
inline |
Definition at line 996 of file pi_level_zero.hpp.
Referenced by _pi_ze_event_list_t::createAndRetainPiZeEventList(), piQueueFinish(), and piQueueRelease().
pi_result _pi_queue::executeCommandList(pi_command_list_ptr_t CommandList, bool IsBlocking = false, bool OKToBatchCommand = false)
Definition at line 1393 of file pi_level_zero.cpp.
References adjustBatchSizeForFullBatch(), CaptureIndirectAccesses(), _pi_event::CleanedUp, CommandListMap, ComputeCommandBatch, _pi_platform::ContextsMutex, CopyCommandBatch, createEventAndAssociateQueue(), Device, cl::sycl::detail::pi::die(), CommandListBatchConfig::dynamic(), hasOpenCommandList(), Healthy, isBatchingAllowed(), LastCommandEvent, _pi_queue::CommandBatch::OpenCommandList, PI_CALL, PI_COMMAND_TYPE_USER, piEventRelease(), piEventRetain(), _pi_device::Platform, PrintPiTrace, _pi_queue::CommandBatch::QueueBatchSize, synchronize(), ZE_CALL, ZE_CALL_NOCHECK, ZeCommandListBatchComputeConfig, ZeCommandListBatchConfig(), ZeCommandListBatchCopyConfig, and _pi_event::ZeEvent.
Referenced by enqueueMemCopyHelper(), enqueueMemCopyRectHelper(), enqueueMemFillHelper(), enqueueMemImageCommandHelper(), executeOpenCommandList(), piEnqueueEventsWait(), piEnqueueEventsWaitWithBarrier(), piEnqueueKernelLaunch(), piEnqueueMemBufferMap(), piEnqueueMemUnmap(), piextUSMEnqueueMemAdvise(), and piextUSMEnqueuePrefetch().
pi_result _pi_queue::executeOpenCommandList(bool IsCopy)
Definition at line 1700 of file pi_level_zero.cpp.
References adjustBatchSizeForPartialBatch(), CommandListMap, ComputeCommandBatch, CopyCommandBatch, executeCommandList(), hasOpenCommandList(), and _pi_queue::CommandBatch::OpenCommandList.
Referenced by _pi_ze_event_list_t::createAndRetainPiZeEventList(), and _pi_context::getAvailableCommandList().
|
inline |
Definition at line 488 of file pi_cuda.hpp.
References compute_stream_mutex_, compute_streams_, num_compute_streams_, num_transfer_streams_, transfer_stream_mutex_, and transfer_streams_.
Referenced by cuda_piQueueRelease().
|
inline |
Definition at line 456 of file pi_cuda.hpp.
References get_next_compute_stream().
Referenced by hip_piEnqueueKernelLaunch(), hip_piEnqueueMemBufferCopy(), hip_piEnqueueMemBufferCopyRect(), hip_piEnqueueMemBufferFill(), hip_piEnqueueMemBufferRead(), hip_piEnqueueMemBufferReadRect(), hip_piEnqueueMemBufferWrite(), hip_piEnqueueMemBufferWriteRect(), hip_piEnqueueMemImageCopy(), hip_piEnqueueMemImageRead(), and hip_piEnqueueMemImageWrite().
|
inline noexcept |
Definition at line 394 of file pi_hip.hpp.
References stream_.
|
inline |
Definition at line 396 of file pi_hip.hpp.
References context_.
|
inline |
Definition at line 571 of file pi_cuda.hpp.
References context_.
Referenced by cuda_piEnqueueEventsWaitWithBarrier(), cuda_piEnqueueKernelLaunch(), cuda_piEnqueueMemBufferCopy(), cuda_piEnqueueMemBufferCopyRect(), cuda_piEnqueueMemBufferFill(), cuda_piEnqueueMemBufferMap(), cuda_piEnqueueMemBufferRead(), cuda_piEnqueueMemBufferReadRect(), cuda_piEnqueueMemBufferWrite(), cuda_piEnqueueMemBufferWriteRect(), cuda_piEnqueueMemImageCopy(), cuda_piEnqueueMemImageRead(), cuda_piEnqueueMemImageWrite(), cuda_piEnqueueMemUnmap(), cuda_piQueueFinish(), cuda_piQueueRelease(), hip_piEnqueueEventsWaitWithBarrier(), hip_piEnqueueKernelLaunch(), hip_piEnqueueMemBufferCopy(), hip_piEnqueueMemBufferCopyRect(), hip_piEnqueueMemBufferFill(), hip_piEnqueueMemBufferMap(), hip_piEnqueueMemBufferRead(), hip_piEnqueueMemBufferReadRect(), hip_piEnqueueMemBufferWrite(), hip_piEnqueueMemBufferWriteRect(), hip_piEnqueueMemImageCopy(), hip_piEnqueueMemImageRead(), hip_piEnqueueMemImageWrite(), hip_piEnqueueMemUnmap(), hip_piQueueFinish(), and hip_piQueueRelease().
|
inline |
Definition at line 573 of file pi_cuda.hpp.
References device_.
Referenced by cuda_piEnqueueKernelLaunch().
Definition at line 380 of file pi_cuda.cpp.
References compute_stream_idx_, compute_stream_mutex_, compute_streams_, delay_compute_, flags_, and num_compute_streams_.
Referenced by cuda_piEnqueueEventsWaitWithBarrier(), cuda_piEnqueueKernelLaunch(), get(), get_next_compute_stream(), and get_next_transfer_stream().
CUstream _pi_queue::get_next_compute_stream(pi_uint32 num_events_in_wait_list, const pi_event * event_wait_list, _pi_stream_guard & guard, pi_uint32 * stream_token = nullptr)
Definition at line 409 of file pi_cuda.cpp.
References can_reuse_stream(), compute_stream_sync_mutex_, delay_compute_, get_next_compute_stream(), _pi_event::get_stream(), and _pi_event::get_stream_token().
|
inline noexcept |
Definition at line 404 of file pi_hip.hpp.
References eventCount_.
|
inline noexcept |
Definition at line 581 of file pi_cuda.hpp.
References eventCount_.
Referenced by _pi_event::record().
CUstream _pi_queue::get_next_transfer_stream()
Definition at line 434 of file pi_cuda.cpp.
References flags_, get_next_compute_stream(), num_transfer_streams_, transfer_stream_idx_, transfer_stream_mutex_, and transfer_streams_.
Referenced by cuda_piEnqueueMemBufferCopy(), cuda_piEnqueueMemBufferCopyRect(), cuda_piEnqueueMemBufferFill(), cuda_piEnqueueMemBufferMap(), cuda_piEnqueueMemBufferRead(), cuda_piEnqueueMemBufferReadRect(), cuda_piEnqueueMemBufferWrite(), cuda_piEnqueueMemBufferWriteRect(), cuda_piEnqueueMemImageCopy(), cuda_piEnqueueMemImageRead(), cuda_piEnqueueMemImageWrite(), and cuda_piEnqueueMemUnmap().
|
inline noexcept |
Definition at line 402 of file pi_hip.hpp.
References refCount_.
|
inline noexcept |
Definition at line 579 of file pi_cuda.hpp.
References refCount_.
Referenced by cuda_piQueueGetInfo(), cuda_piQueueRetain(), hip_piQueueGetInfo(), and hip_piQueueRetain().
|
inline |
Definition at line 859 of file pi_level_zero.hpp.
Referenced by _pi_context::getAvailableCommandList().
|
inline |
Definition at line 458 of file pi_cuda.hpp.
References last_sync_compute_streams_, and max().
Referenced by can_reuse_stream().
|
inline |
Definition at line 964 of file pi_level_zero.hpp.
References _pi_queue::CommandBatch::OpenCommandList.
Referenced by eventOpenCommandList(), executeCommandList(), executeOpenCommandList(), and _pi_context::getAvailableCommandList().
|
inline noexcept |
Definition at line 398 of file pi_hip.hpp.
References refCount_.
|
inline noexcept |
Definition at line 575 of file pi_cuda.hpp.
References refCount_.
Referenced by cuda_piQueueRetain(), and hip_piQueueRetain().
bool _pi_queue::isBatchingAllowed(bool IsCopy) const
Definition at line 1551 of file pi_level_zero.cpp.
References ComputeCommandBatch, CopyCommandBatch, and _pi_queue::CommandBatch::QueueBatchSize.
Referenced by executeCommandList().
bool _pi_queue::isInOrderQueue() const
Definition at line 888 of file pi_level_zero.cpp.
References PI_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE, and Properties.
Referenced by _pi_ze_event_list_t::createAndRetainPiZeEventList(), piEnqueueMemBufferMap(), piEnqueueMemUnmap(), and useCopyEngine().
pi_result _pi_queue::resetCommandList(pi_command_list_ptr_t CommandList, bool MakeAvailable, std::vector< _pi_event * > & EventListToCleanup)
Definition at line 894 of file pi_level_zero.cpp.
References Context, Device, ZE_CALL, _pi_context::ZeCommandListCacheMutex, _pi_context::ZeComputeCommandListCache, _pi_context::ZeCopyCommandListCache, and _pi_device::ZeDevice.
Referenced by _pi_context::getAvailableCommandList(), piQueueRelease(), and resetCommandLists().
|
inline |
Definition at line 509 of file pi_cuda.hpp.
References compute_stream_idx_, compute_stream_mutex_, compute_stream_sync_mutex_, compute_streams_, delay_compute_, last_sync_compute_streams_, last_sync_transfer_streams_, num_compute_streams_, num_transfer_streams_, transfer_stream_idx_, transfer_stream_mutex_, and transfer_streams_.
Referenced by cuda_piQueueFinish().
pi_result _pi_queue::synchronize()
Definition at line 6105 of file pi_level_zero.cpp.
References CommandListMap, _pi_event::Completed, ComputeQueueGroup, Context, CopyQueueGroup, EventCreate(), Healthy, _pi_queue::pi_queue_group_t::ImmCmdLists, PI_CALL, piEventRelease(), ZE_CALL, _pi_event::ZeEvent, and _pi_queue::pi_queue_group_t::ZeQueues.
Referenced by executeCommandList(), piEnqueueEventsWait(), piQueueFinish(), and piQueueRelease().
bool _pi_queue::useCopyEngine(bool PreferCopyEngine = true) const
Definition at line 6091 of file pi_level_zero.cpp.
References CopyQueueGroup, isInOrderQueue(), and _pi_queue::pi_queue_group_t::ZeQueues.
Referenced by enqueueMemCopyHelper(), enqueueMemCopyRectHelper(), enqueueMemFillHelper(), and enqueueMemImageCommandHelper().
cm_support::CmQueue* _pi_queue::CmQueuePtr = nullptr |
Definition at line 114 of file pi_esimd_emulator.hpp.
Referenced by piQueueRelease().
pi_command_list_map_t _pi_queue::CommandListMap |
Definition at line 900 of file pi_level_zero.hpp.
Referenced by _pi_ze_event_list_t::createAndRetainPiZeEventList(), createEventAndAssociateQueue(), eventOpenCommandList(), executeCommandList(), executeOpenCommandList(), _pi_context::getAvailableCommandList(), piEnqueueEventsWait(), piEnqueueMemBufferMap(), piEnqueueMemUnmap(), piQueueRelease(), resetCommandLists(), and synchronize().
std::atomic_uint32_t _pi_queue::compute_stream_idx_ |
Definition at line 409 of file pi_cuda.hpp.
Referenced by can_reuse_stream(), get_next_compute_stream(), and sync_streams().
std::mutex _pi_queue::compute_stream_mutex_ |
Definition at line 420 of file pi_cuda.hpp.
Referenced by for_each_stream(), get_next_compute_stream(), and sync_streams().
std::mutex _pi_queue::compute_stream_sync_mutex_ |
Definition at line 419 of file pi_cuda.hpp.
Referenced by get_next_compute_stream(), and sync_streams().
std::vector<native_type> _pi_queue::compute_streams_ |
Definition at line 397 of file pi_cuda.hpp.
Referenced by can_reuse_stream(), for_each_stream(), get_next_compute_stream(), and sync_streams().
command_batch _pi_queue::ComputeCommandBatch |
Definition at line 925 of file pi_level_zero.hpp.
Referenced by adjustBatchSizeForFullBatch(), adjustBatchSizeForPartialBatch(), eventOpenCommandList(), executeCommandList(), executeOpenCommandList(), _pi_context::getAvailableCommandList(), isBatchingAllowed(), and piQueueReleaseInternal().
pi_queue_group_t _pi_queue::ComputeQueueGroup {this, queue_type::Compute} |
Definition at line 849 of file pi_level_zero.hpp.
Referenced by piextQueueGetNativeHandle(), piQueueFinish(), piQueueReleaseInternal(), and synchronize().
pi_context _pi_queue::Context = nullptr |
Definition at line 113 of file pi_esimd_emulator.hpp.
Referenced by _pi_queue(), USMSharedMemoryAlloc::allocateImpl(), USMSharedReadOnlyMemoryAlloc::allocateImpl(), USMDeviceMemoryAlloc::allocateImpl(), USMHostMemoryAlloc::allocateImpl(), ContextReleaseHelper(), createEventAndAssociateQueue(), USMMemoryAllocBase::deallocate(), enqueueMemCopyHelper(), enqueueMemCopyRectHelper(), enqueueMemFillHelper(), enqueueMemImageCommandHelper(), EventCreate(), _pi_buffer::free(), _pi_context::getAvailableCommandList(), _pi_buffer::getZeHandle(), IsDevicePointer(), piclProgramCreateWithSource(), piContextGetInfo(), piContextRelease(), piContextRetain(), piEnqueueEventsWait(), piEnqueueEventsWaitWithBarrier(), piEnqueueKernelLaunch(), piEnqueueMemBufferMap(), piEnqueueMemUnmap(), piEventCreate(), piEventRelease(), piextContextGetNativeHandle(), piextContextSetExtendedDeleter(), piextEventCreateWithNativeHandle(), piextKernelCreateWithNativeHandle(), piextMemCreateWithNativeHandle(), piextProgramCreateWithNativeHandle(), piextQueueCreateWithNativeHandle(), piextUSMDeviceAlloc(), piextUSMEnqueueMemAdvise(), piextUSMEnqueueMemcpy(), piextUSMEnqueuePrefetch(), piextUSMFree(), piextUSMGetMemAllocInfo(), piextUSMHostAlloc(), piextUSMSharedAlloc(), piMemBufferCreate(), piMemImageCreate(), piProgramCreate(), piProgramCreateWithBinary(), piProgramLink(), piQueueCreate(), piQueueGetInfo(), piSamplerCreate(), resetCommandList(), synchronize(), USMDeviceAllocImpl(), USMFreeHelper(), USMFreeImpl(), USMHostAllocImpl(), USMSharedAllocImpl(), ZeDeviceMemAllocHelper(), ZeHostMemAllocHelper(), and ZeMemFreeHelper().
const pi_context _pi_queue::Context |
Definition at line 871 of file pi_level_zero.hpp.
_pi_context * _pi_queue::context_ |
Definition at line 404 of file pi_cuda.hpp.
Referenced by cuda_piQueueGetInfo(), get_context(), hip_piQueueGetInfo(), and ~_pi_queue().
command_batch _pi_queue::CopyCommandBatch |
Definition at line 925 of file pi_level_zero.hpp.
Referenced by adjustBatchSizeForFullBatch(), adjustBatchSizeForPartialBatch(), eventOpenCommandList(), executeCommandList(), executeOpenCommandList(), _pi_context::getAvailableCommandList(), isBatchingAllowed(), and piQueueReleaseInternal().
pi_queue_group_t _pi_queue::CopyQueueGroup {this, queue_type::MainCopy} |
Definition at line 854 of file pi_level_zero.hpp.
Referenced by piQueueFinish(), piQueueReleaseInternal(), synchronize(), and useCopyEngine().
|
static constexpr |
Definition at line 394 of file pi_cuda.hpp.
Referenced by cuda_piQueueCreate().
|
static constexpr |
Definition at line 395 of file pi_cuda.hpp.
Referenced by cuda_piQueueCreate().
std::vector<bool> _pi_queue::delay_compute_ |
Definition at line 403 of file pi_cuda.hpp.
Referenced by get_next_compute_stream(), and sync_streams().
const pi_device _pi_queue::Device |
Definition at line 876 of file pi_level_zero.hpp.
Referenced by USMSharedMemoryAlloc::allocateImpl(), USMSharedReadOnlyMemoryAlloc::allocateImpl(), USMDeviceMemoryAlloc::allocateImpl(), CaptureIndirectAccesses(), enqueueMemFillHelper(), enqueueMemImageCommandHelper(), executeCommandList(), _pi_context::getAvailableCommandList(), _pi_queue::pi_queue_group_t::getQueueIndex(), _pi_buffer::getZeHandle(), _pi_buffer::getZeHandlePtr(), pi_command_list_info_t::isCopy(), piDeviceGetInfo(), piDevicePartition(), piDeviceRelease(), piDeviceRetain(), piEnqueueKernelLaunch(), piEnqueueMemBufferCopy(), piEnqueueMemBufferCopyRect(), piEnqueueMemBufferFill(), piEnqueueMemBufferMap(), piEnqueueMemBufferRead(), piEnqueueMemBufferReadRect(), piEnqueueMemBufferWrite(), piEnqueueMemBufferWriteRect(), piEnqueueMemUnmap(), piEventGetProfilingInfo(), piextDeviceCreateWithNativeHandle(), piextDeviceGetNativeHandle(), piextDeviceSelectBinary(), piextGetDeviceFunctionPointer(), piextMemCreateWithNativeHandle(), piextQueueCreateWithNativeHandle(), piextUSMDeviceAlloc(), piextUSMEnqueueMemAdvise(), piextUSMGetMemAllocInfo(), piextUSMSharedAlloc(), piKernelGetGroupInfo(), piKernelGetSubGroupInfo(), piMemImageCreate(), piProgramGetBuildInfo(), piQueueCreate(), piQueueGetInfo(), piSamplerCreate(), resetCommandList(), USMDeviceAllocImpl(), USMFreeHelper(), USMSharedAllocImpl(), and ZeDeviceMemAllocHelper().
_pi_device * _pi_queue::device_ |
Definition at line 405 of file pi_cuda.hpp.
Referenced by cuda_piEnqueueKernelLaunch(), cuda_piQueueGetInfo(), get_device(), hip_piEnqueueKernelLaunch(), hip_piQueueGetInfo(), and ~_pi_queue().
std::atomic_uint32_t _pi_queue::eventCount_ |
Definition at line 408 of file pi_cuda.hpp.
Referenced by get_next_event_id().
unsigned int _pi_queue::flags_ |
Definition at line 415 of file pi_cuda.hpp.
Referenced by get_next_compute_stream(), and get_next_transfer_stream().
bool _pi_queue::has_ownership_ |
Definition at line 422 of file pi_cuda.hpp.
Referenced by backend_has_ownership().
bool _pi_queue::Healthy {true} |
Definition at line 1018 of file pi_level_zero.hpp.
Referenced by executeCommandList(), piQueueRelease(), and synchronize().
std::vector<pi_kernel> _pi_queue::KernelsToBeSubmitted |
Definition at line 890 of file pi_level_zero.hpp.
Referenced by CaptureIndirectAccesses(), and piEnqueueKernelLaunch().
unsigned int _pi_queue::last_sync_compute_streams_ |
Definition at line 413 of file pi_cuda.hpp.
Referenced by has_been_synchronized(), and sync_streams().
unsigned int _pi_queue::last_sync_transfer_streams_ |
Definition at line 414 of file pi_cuda.hpp.
Referenced by sync_streams().
pi_event _pi_queue::LastCommandEvent = nullptr |
Definition at line 882 of file pi_level_zero.hpp.
Referenced by CleanupCompletedEvent(), _pi_ze_event_list_t::createAndRetainPiZeEventList(), executeCommandList(), piEnqueueEventsWait(), piEnqueueMemBufferMap(), piEnqueueMemUnmap(), and piQueueFinish().
unsigned int _pi_queue::num_compute_streams_ |
Definition at line 411 of file pi_cuda.hpp.
Referenced by for_each_stream(), get_next_compute_stream(), and sync_streams().
unsigned int _pi_queue::num_transfer_streams_ |
Definition at line 412 of file pi_cuda.hpp.
Referenced by for_each_stream(), get_next_transfer_stream(), and sync_streams().
bool _pi_queue::OwnZeCommandQueue |
Definition at line 897 of file pi_level_zero.hpp.
Referenced by piQueueReleaseInternal().
pi_queue_properties _pi_queue::Properties |
Definition at line 934 of file pi_level_zero.hpp.
Referenced by EventCreate(), _pi_kernel::initialize(), isInOrderQueue(), piContextCreate(), piDevicePartition(), piEventGetProfilingInfo(), piextUSMDeviceAlloc(), piextUSMHostAlloc(), piextUSMSharedAlloc(), piQueueCreate(), USMDeviceAllocImpl(), USMHostAllocImpl(), and USMSharedAllocImpl().
pi_queue_properties _pi_queue::properties_ |
Definition at line 406 of file pi_cuda.hpp.
Referenced by cuda_piQueueGetInfo(), hip_piQueueGetInfo(), _pi_event::release(), and _pi_event::start().
std::atomic_uint32_t _pi_queue::refCount_ |
Definition at line 407 of file pi_cuda.hpp.
Referenced by decrement_reference_count(), get_reference_count(), and increment_reference_count().
pi_uint32 _pi_queue::RefCountExternal {1} |
Definition at line 1015 of file pi_level_zero.hpp.
Referenced by piQueueRelease(), and piQueueRetain().
native_type _pi_queue::stream_ |
Definition at line 374 of file pi_hip.hpp.
Referenced by get(), and hip_piQueueFinish().
std::atomic_uint32_t _pi_queue::transfer_stream_idx_ |
Definition at line 410 of file pi_cuda.hpp.
Referenced by get_next_transfer_stream(), and sync_streams().
std::mutex _pi_queue::transfer_stream_mutex_ |
Definition at line 421 of file pi_cuda.hpp.
Referenced by for_each_stream(), get_next_transfer_stream(), and sync_streams().
std::vector<native_type> _pi_queue::transfer_streams_ |
Definition at line 398 of file pi_cuda.hpp.
Referenced by for_each_stream(), get_next_transfer_stream(), and sync_streams().