DPC++ Runtime
Runtime libraries for oneAPI DPC++
queue_impl.cpp
Go to the documentation of this file.
1 //==------------------ queue_impl.cpp - SYCL queue -------------------------==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include <detail/event_impl.hpp>
11 #include <detail/queue_impl.hpp>
12 #include <sycl/context.hpp>
13 #include <sycl/detail/pi.hpp>
14 #include <sycl/device.hpp>
15 
16 #include <cstring>
17 #include <utility>
18 
19 #ifdef XPTI_ENABLE_INSTRUMENTATION
20 #include "xpti/xpti_trace_framework.hpp"
21 #include <detail/xpti_registry.hpp>
22 #include <sstream>
23 #endif
24 
25 namespace sycl {
27 namespace detail {
28 template <>
29 uint32_t queue_impl::get_info<info::queue::reference_count>() const {
30  RT::PiResult result = PI_SUCCESS;
31  if (!is_host())
33  MQueues[0], PI_QUEUE_INFO_REFERENCE_COUNT, sizeof(result), &result,
34  nullptr);
35  return result;
36 }
37 
38 template <> context queue_impl::get_info<info::queue::context>() const {
39  return get_context();
40 }
41 
42 template <> device queue_impl::get_info<info::queue::device>() const {
43  return get_device();
44 }
45 
46 static event
47 prepareUSMEvent(const std::shared_ptr<detail::queue_impl> &QueueImpl,
48  RT::PiEvent NativeEvent) {
49  auto EventImpl = std::make_shared<detail::event_impl>(QueueImpl);
50  EventImpl->getHandleRef() = NativeEvent;
51  EventImpl->setContextImpl(detail::getSyclObjImpl(QueueImpl->get_context()));
52  EventImpl->setStateIncomplete();
53  return detail::createSyclObjFromImpl<event>(EventImpl);
54 }
55 
56 static event createDiscardedEvent() {
57  EventImplPtr EventImpl =
58  std::make_shared<event_impl>(event_impl::HES_Discarded);
59  return createSyclObjFromImpl<event>(EventImpl);
60 }
61 
/// Enqueues a USM fill of Count bytes at Ptr with Value on this queue,
/// honoring DepEvents. Returns an event for the operation, or a discarded
/// event when event discarding is enabled for this queue.
event queue_impl::memset(const std::shared_ptr<detail::queue_impl> &Self,
                         void *Ptr, int Value, size_t Count,
                         const std::vector<event> &DepEvents) {
  // Fast path: submit the fill without requesting a native event back and
  // hand the caller a discarded event.
  if (MHasDiscardEventsSupport) {
    MemoryManager::fill_usm(Ptr, Self, Count, Value,
                            getOrWaitEvents(DepEvents, MContext), nullptr);
    return createDiscardedEvent();
  }
  event ResEvent;
  {
    // We need to submit command and update the last event under same lock if we
    // have in-order queue.
    auto ScopeLock = isInOrder() ? std::unique_lock<std::mutex>(MLastEventMtx)
                                 : std::unique_lock<std::mutex>();
    // If the last submitted command in the in-order queue is host_task then
    // wait for it before submitting usm command.
    if (isInOrder() && (MLastCGType == CG::CGTYPE::CodeplayHostTask ||
                        MLastCGType == CG::CGTYPE::CodeplayInteropTask))
      MLastEvent.wait();

    RT::PiEvent NativeEvent{};
    MemoryManager::fill_usm(Ptr, Self, Count, Value,
                            getOrWaitEvents(DepEvents, MContext), &NativeEvent);

    // Host contexts produce no native event to wrap; return straight away
    // (ScopeLock is released by the early return).
    if (MContext->is_host())
      return MDiscardEvents ? createDiscardedEvent() : event();

    ResEvent = prepareUSMEvent(Self, NativeEvent);
    if (isInOrder()) {
      MLastEvent = ResEvent;
      // We don't create a command group for usm commands, so set it to None.
      // This variable is used to perform explicit dependency management when
      // required.
      MLastCGType = CG::CGTYPE::None;
    }
  }
  // Track only if we won't be able to handle it with piQueueFinish.
  if (!MSupportOOO)
    addSharedEvent(ResEvent);
  return MDiscardEvents ? createDiscardedEvent() : ResEvent;
}
103 
/// Enqueues a USM copy of Count bytes from Src to Dest on this queue,
/// honoring DepEvents. Returns an event for the operation, or a discarded
/// event when event discarding is enabled for this queue.
event queue_impl::memcpy(const std::shared_ptr<detail::queue_impl> &Self,
                         void *Dest, const void *Src, size_t Count,
                         const std::vector<event> &DepEvents) {
  // Fast path: submit the copy without requesting a native event back and
  // hand the caller a discarded event.
  if (MHasDiscardEventsSupport) {
    MemoryManager::copy_usm(Src, Self, Count, Dest,
                            getOrWaitEvents(DepEvents, MContext), nullptr);
    return createDiscardedEvent();
  }
  event ResEvent;
  {
    // We need to submit command and update the last event under same lock if we
    // have in-order queue.
    auto ScopeLock = isInOrder() ? std::unique_lock<std::mutex>(MLastEventMtx)
                                 : std::unique_lock<std::mutex>();
    // If the last submitted command in the in-order queue is host_task then
    // wait for it before submitting usm command.
    if (isInOrder() && (MLastCGType == CG::CGTYPE::CodeplayHostTask ||
                        MLastCGType == CG::CGTYPE::CodeplayInteropTask))
      MLastEvent.wait();

    RT::PiEvent NativeEvent{};
    MemoryManager::copy_usm(Src, Self, Count, Dest,
                            getOrWaitEvents(DepEvents, MContext), &NativeEvent);

    // Host contexts produce no native event to wrap; return straight away
    // (ScopeLock is released by the early return).
    if (MContext->is_host())
      return MDiscardEvents ? createDiscardedEvent() : event();

    ResEvent = prepareUSMEvent(Self, NativeEvent);
    if (isInOrder()) {
      MLastEvent = ResEvent;
      // We don't create a command group for usm commands, so set it to None.
      // This variable is used to perform explicit dependency management when
      // required.
      MLastCGType = CG::CGTYPE::None;
    }
  }
  // Track only if we won't be able to handle it with piQueueFinish.
  if (!MSupportOOO)
    addSharedEvent(ResEvent);
  return MDiscardEvents ? createDiscardedEvent() : ResEvent;
}
145 
/// Enqueues a USM memory-advice hint for the Length bytes at Ptr on this
/// queue, honoring DepEvents. Returns an event for the operation, or a
/// discarded event when event discarding is enabled for this queue.
event queue_impl::mem_advise(const std::shared_ptr<detail::queue_impl> &Self,
                             const void *Ptr, size_t Length,
                             pi_mem_advice Advice,
                             const std::vector<event> &DepEvents) {
  // Fast path: submit the advice without requesting a native event back and
  // hand the caller a discarded event.
  if (MHasDiscardEventsSupport) {
    MemoryManager::advise_usm(Ptr, Self, Length, Advice,
                              getOrWaitEvents(DepEvents, MContext), nullptr);
    return createDiscardedEvent();
  }
  event ResEvent;
  {
    // We need to submit command and update the last event under same lock if we
    // have in-order queue.
    auto ScopeLock = isInOrder() ? std::unique_lock<std::mutex>(MLastEventMtx)
                                 : std::unique_lock<std::mutex>();
    // If the last submitted command in the in-order queue is host_task then
    // wait for it before submitting usm command.
    if (isInOrder() && (MLastCGType == CG::CGTYPE::CodeplayHostTask ||
                        MLastCGType == CG::CGTYPE::CodeplayInteropTask))
      MLastEvent.wait();

    RT::PiEvent NativeEvent{};
    MemoryManager::advise_usm(Ptr, Self, Length, Advice,
                              getOrWaitEvents(DepEvents, MContext),
                              &NativeEvent);

    // Host contexts produce no native event to wrap; return straight away
    // (ScopeLock is released by the early return).
    if (MContext->is_host())
      return MDiscardEvents ? createDiscardedEvent() : event();

    ResEvent = prepareUSMEvent(Self, NativeEvent);
    if (isInOrder()) {
      MLastEvent = ResEvent;
      // We don't create a command group for usm commands, so set it to None.
      // This variable is used to perform explicit dependency management when
      // required.
      MLastCGType = CG::CGTYPE::None;
    }
  }
  // Track only if we won't be able to handle it with piQueueFinish.
  if (!MSupportOOO)
    addSharedEvent(ResEvent);
  return MDiscardEvents ? createDiscardedEvent() : ResEvent;
}
189 
190 void queue_impl::addEvent(const event &Event) {
191  EventImplPtr EImpl = getSyclObjImpl(Event);
192  assert(EImpl && "Event implementation is missing");
193  auto *Cmd = static_cast<Command *>(EImpl->getCommand());
194  if (!Cmd) {
195  // if there is no command on the event, we cannot track it with MEventsWeak
196  // as that will leave it with no owner. Track in MEventsShared only if we're
197  // unable to call piQueueFinish during wait.
198  if (is_host() || !MSupportOOO)
199  addSharedEvent(Event);
200  }
201  // As long as the queue supports piQueueFinish we only need to store events
202  // with command nodes in the following cases:
203  // 1. Unenqueued commands, since they aren't covered by piQueueFinish.
204  // 2. Kernels with streams, since they are not supported by post enqueue
205  // cleanup.
206  // 3. Host tasks, for both reasons.
207  else if (is_host() || !MSupportOOO || EImpl->getHandleRef() == nullptr ||
208  EImpl->needsCleanupAfterWait()) {
209  std::weak_ptr<event_impl> EventWeakPtr{EImpl};
210  std::lock_guard<std::mutex> Lock{MMutex};
211  MEventsWeak.push_back(std::move(EventWeakPtr));
212  }
213 }
214 
218 void queue_impl::addSharedEvent(const event &Event) {
219  assert(is_host() || !MSupportOOO);
220  std::lock_guard<std::mutex> Lock(MMutex);
221  // Events stored in MEventsShared are not released anywhere else aside from
222  // calls to queue::wait/wait_and_throw, which a user application might not
223  // make, and ~queue_impl(). If the number of events grows large enough,
224  // there's a good chance that most of them are already completed and ownership
225  // of them can be released.
226  const size_t EventThreshold = 128;
227  if (MEventsShared.size() >= EventThreshold) {
228  // Generally, the vector is ordered so that the oldest events are in the
229  // front and the newer events are in the end. So, search to find the first
230  // event that isn't yet complete. All the events prior to that can be
231  // erased. This could leave some few events further on that have completed
232  // not yet erased, but that is OK. This cleanup doesn't have to be perfect.
233  // This also keeps the algorithm linear rather than quadratic because it
234  // doesn't continually recheck things towards the back of the list that
235  // really haven't had time to complete.
236  MEventsShared.erase(
237  MEventsShared.begin(),
238  std::find_if(
239  MEventsShared.begin(), MEventsShared.end(), [](const event &E) {
240  return E.get_info<info::event::command_execution_status>() !=
241  info::event_command_status::complete;
242  }));
243  }
244  MEventsShared.push_back(Event);
245 }
246 
/// Opens an XPTI trace scope for a queue wait() call. Returns the trace event
/// as an opaque pointer (nullptr when tracing is disabled or unavailable) and
/// fills Name and IId for the matching instrumentationEpilog() call.
void *queue_impl::instrumentationProlog(const detail::code_location &CodeLoc,
                                        std::string &Name, int32_t StreamID,
                                        uint64_t &IId) {
  void *TraceEvent = nullptr;
  // Parameters are unused when XPTI instrumentation is compiled out.
  (void)CodeLoc;
  (void)Name;
  (void)StreamID;
  (void)IId;
#ifdef XPTI_ENABLE_INSTRUMENTATION
  xpti::trace_event_data_t *WaitEvent = nullptr;
  if (!xptiTraceEnabled())
    return TraceEvent;

  xpti::payload_t Payload;
  bool HasSourceInfo = false;
  // We try to create a unique string for the wait() call by combining it with
  // the queue address
  xpti::utils::StringHelper NG;
  Name = NG.nameWithAddress<queue_impl *>("queue.wait", this);

  if (CodeLoc.fileName()) {
    // We have source code location information
    Payload =
        xpti::payload_t(Name.c_str(), CodeLoc.fileName(), CodeLoc.lineNumber(),
                        CodeLoc.columnNumber(), (void *)this);
    HasSourceInfo = true;
  } else {
    // We have no location information, so we'll use the address of the queue
    Payload = xpti::payload_t(Name.c_str(), (void *)this);
  }
  // wait() calls could be at different user-code locations; We create a new
  // event based on the code location info and if this has been seen before, a
  // previously created event will be returned.
  uint64_t QWaitInstanceNo = 0;
  WaitEvent = xptiMakeEvent(Name.c_str(), &Payload, xpti::trace_graph_event,
                            xpti_at::active, &QWaitInstanceNo);
  IId = QWaitInstanceNo;
  if (WaitEvent) {
    // Attach device and source metadata, then notify subscribers that the
    // wait scope has begun.
    device D = get_device();
    std::string DevStr;
    if (getSyclObjImpl(D)->is_host())
      DevStr = "HOST";
    else if (D.is_cpu())
      DevStr = "CPU";
    else if (D.is_gpu())
      DevStr = "GPU";
    else if (D.is_accelerator())
      DevStr = "ACCELERATOR";
    else
      DevStr = "UNKNOWN";
    xpti::addMetadata(WaitEvent, "sycl_device", DevStr);
    if (HasSourceInfo) {
      xpti::addMetadata(WaitEvent, "sym_function_name", CodeLoc.functionName());
      xpti::addMetadata(WaitEvent, "sym_source_file_name", CodeLoc.fileName());
      xpti::addMetadata(WaitEvent, "sym_line_no",
                        static_cast<int32_t>((CodeLoc.lineNumber())));
      xpti::addMetadata(WaitEvent, "sym_column_no",
                        static_cast<int32_t>((CodeLoc.columnNumber())));
    }
    xptiNotifySubscribers(StreamID, xpti::trace_wait_begin, nullptr, WaitEvent,
                          QWaitInstanceNo,
                          static_cast<const void *>(Name.c_str()));
    TraceEvent = (void *)WaitEvent;
  }
#endif
  return TraceEvent;
}
314 
315 void queue_impl::instrumentationEpilog(void *TelemetryEvent, std::string &Name,
316  int32_t StreamID, uint64_t IId) {
317  (void)TelemetryEvent;
318  (void)Name;
319  (void)StreamID;
320  (void)IId;
321 #ifdef XPTI_ENABLE_INSTRUMENTATION
322  if (!(xptiTraceEnabled() && TelemetryEvent))
323  return;
324  // Close the wait() scope
325  xpti::trace_event_data_t *TraceEvent =
326  (xpti::trace_event_data_t *)TelemetryEvent;
327  xptiNotifySubscribers(StreamID, xpti::trace_wait_end, nullptr, TraceEvent,
328  IId, static_cast<const void *>(Name.c_str()));
329 #endif
330 }
331 
/// Blocks until all commands submitted to this queue have completed.
/// Tracked events are drained from MEventsWeak/MEventsShared, then stream
/// service events; XPTI trace notifications bracket the whole wait when
/// instrumentation is enabled.
void queue_impl::wait(const detail::code_location &CodeLoc) {
  (void)CodeLoc;
#ifdef XPTI_ENABLE_INSTRUMENTATION
  void *TelemetryEvent = nullptr;
  uint64_t IId;
  std::string Name;
  int32_t StreamID = xptiRegisterStream(SYCL_STREAM_NAME);
  TelemetryEvent = instrumentationProlog(CodeLoc, Name, StreamID, IId);
#endif

  // Take the event lists under the lock, then operate on local copies so
  // MMutex is not held while blocking on events.
  std::vector<std::weak_ptr<event_impl>> WeakEvents;
  std::vector<event> SharedEvents;
  {
    std::lock_guard<std::mutex> Lock(MMutex);
    WeakEvents.swap(MEventsWeak);
    SharedEvents.swap(MEventsShared);
  }
  // If the queue is either a host one or does not support OOO (and we use
  // multiple in-order queues as a result of that), wait for each event
  // directly. Otherwise, only wait for unenqueued or host task events, starting
  // from the latest submitted task in order to minimize total amount of calls,
  // then handle the rest with piQueueFinish.
  const bool SupportsPiFinish = !is_host() && MSupportOOO;
  for (auto EventImplWeakPtrIt = WeakEvents.rbegin();
       EventImplWeakPtrIt != WeakEvents.rend(); ++EventImplWeakPtrIt) {
    if (std::shared_ptr<event_impl> EventImplSharedPtr =
            EventImplWeakPtrIt->lock()) {
      // A nullptr PI event indicates that piQueueFinish will not cover it,
      // either because it's a host task event or an unenqueued one.
      if (!SupportsPiFinish || nullptr == EventImplSharedPtr->getHandleRef()) {
        EventImplSharedPtr->wait(EventImplSharedPtr);
      }
    }
  }
  if (SupportsPiFinish) {
    const detail::plugin &Plugin = getPlugin();
    Plugin.call<detail::PiApiKind::piQueueFinish>(getHandleRef());
    // After the backend queue has drained, run post-wait cleanup for events
    // that still need it (see addEvent() for which events those are).
    for (std::weak_ptr<event_impl> &EventImplWeakPtr : WeakEvents)
      if (std::shared_ptr<event_impl> EventImplSharedPtr =
              EventImplWeakPtr.lock())
        if (EventImplSharedPtr->needsCleanupAfterWait())
          EventImplSharedPtr->cleanupCommand(EventImplSharedPtr);
    assert(SharedEvents.empty() && "Queues that support calling piQueueFinish "
                                   "shouldn't have shared events");
  } else {
    for (event &Event : SharedEvents)
      Event.wait();
  }

  // Wait for any stream service events recorded for this queue.
  std::vector<EventImplPtr> StreamsServiceEvents;
  {
    std::lock_guard<std::mutex> Lock(MMutex);
    StreamsServiceEvents.swap(MStreamsServiceEvents);
  }
  for (const EventImplPtr &Event : StreamsServiceEvents)
    Event->wait(Event);

#ifdef XPTI_ENABLE_INSTRUMENTATION
  instrumentationEpilog(TelemetryEvent, Name, StreamID, IId);
#endif
}
393 
394 pi_native_handle queue_impl::getNative() const {
395  const detail::plugin &Plugin = getPlugin();
396  if (Plugin.getBackend() == backend::opencl)
397  Plugin.call<PiApiKind::piQueueRetain>(MQueues[0]);
398  pi_native_handle Handle{};
399  Plugin.call<PiApiKind::piextQueueGetNativeHandle>(MQueues[0], &Handle);
400  return Handle;
401 }
402 
403 bool queue_impl::ext_oneapi_empty() const {
404  // If we have in-order queue where events are not discarded then just check
405  // the status of the last event.
406  if (isInOrder() && !MDiscardEvents) {
407  std::lock_guard<std::mutex> Lock(MLastEventMtx);
408  return MLastEvent.get_info<info::event::command_execution_status>() ==
409  info::event_command_status::complete;
410  }
411 
412  // Check the status of the backend queue if this is not a host queue.
413  if (!is_host()) {
414  pi_bool IsReady = false;
416  MQueues[0], PI_EXT_ONEAPI_QUEUE_INFO_EMPTY, sizeof(pi_bool), &IsReady,
417  nullptr);
418  if (!IsReady)
419  return false;
420  }
421 
422  // We may have events like host tasks which are not submitted to the backend
423  // queue so we need to get their status separately.
424  std::lock_guard<std::mutex> Lock(MMutex);
425  for (event Event : MEventsShared)
426  if (Event.get_info<info::event::command_execution_status>() !=
427  info::event_command_status::complete)
428  return false;
429 
430  for (auto EventImplWeakPtrIt = MEventsWeak.begin();
431  EventImplWeakPtrIt != MEventsWeak.end(); ++EventImplWeakPtrIt)
432  if (std::shared_ptr<event_impl> EventImplSharedPtr =
433  EventImplWeakPtrIt->lock())
434  if (EventImplSharedPtr->is_host() &&
435  EventImplSharedPtr
436  ->get_info<info::event::command_execution_status>() !=
437  info::event_command_status::complete)
438  return false;
439 
440  // If we didn't exit early above then it means that all events in the queue
441  // are completed.
442  return true;
443 }
444 
445 } // namespace detail
446 } // __SYCL_INLINE_VER_NAMESPACE(_V1)
447 } // namespace sycl
The context class represents a SYCL context on which kernel functions may be executed.
Definition: context.hpp:41
The Command class represents some action that needs to be performed on one or more memory objects.
Definition: commands.hpp:95
The plugin class provides a unified interface to the underlying low-level runtimes for the device-agn...
Definition: plugin.hpp:90
void call(ArgsT... Args) const
Calls the API, traces the call, checks the result.
Definition: plugin.hpp:217
backend getBackend(void) const
Definition: plugin.hpp:229
The SYCL device class encapsulates a single SYCL device on which kernels may be executed.
Definition: device.hpp:49
bool is_accelerator() const
Check if device is an accelerator device.
Definition: device.cpp:87
bool is_gpu() const
Check if device is a GPU device.
Definition: device.cpp:85
bool is_cpu() const
Check if device is a CPU device.
Definition: device.cpp:83
An event object can be used to synchronize memory transfers, enqueues of kernels and signaling barrie...
Definition: event.hpp:40
#define __SYCL_INLINE_VER_NAMESPACE(X)
::pi_event PiEvent
Definition: pi.hpp:121
const plugin & getPlugin()
Definition: pi.cpp:509
::pi_result PiResult
Definition: pi.hpp:108
std::vector< RT::PiEvent > getOrWaitEvents(std::vector< sycl::event > DepEvents, std::shared_ptr< sycl::detail::context_impl > Context)
constexpr const char * SYCL_STREAM_NAME
static event createDiscardedEvent()
Definition: queue_impl.cpp:56
decltype(Obj::impl) getSyclObjImpl(const Obj &SyclObject)
Definition: common.hpp:248
std::shared_ptr< event_impl > EventImplPtr
Definition: cg.hpp:42
static event prepareUSMEvent(const std::shared_ptr< detail::queue_impl > &QueueImpl, RT::PiEvent NativeEvent)
Definition: queue_impl.cpp:47
void memcpy(void *Dst, const void *Src, std::size_t Size)
----- Error handling, matching OpenCL plugin semantics.
Definition: access.hpp:14
pi_result piQueueFinish(pi_queue command_queue)
uintptr_t pi_native_handle
Definition: pi.h:111
pi_uint32 pi_bool
Definition: pi.h:109
@ PI_QUEUE_INFO_REFERENCE_COUNT
Definition: pi.h:335
@ PI_EXT_ONEAPI_QUEUE_INFO_EMPTY
Definition: pi.h:339
_pi_mem_advice
Definition: pi.h:429
pi_result piextQueueGetNativeHandle(pi_queue queue, pi_native_handle *nativeHandle)
Gets the native handle of a PI queue object.
pi_result piQueueGetInfo(pi_queue command_queue, pi_queue_info param_name, size_t param_value_size, void *param_value, size_t *param_value_size_ret)
pi_result piQueueRetain(pi_queue command_queue)
C++ wrapper of extern "C" PI interfaces.
constexpr unsigned long columnNumber() const noexcept
Definition: common.hpp:88
constexpr const char * fileName() const noexcept
Definition: common.hpp:89
constexpr const char * functionName() const noexcept
Definition: common.hpp:90
constexpr unsigned long lineNumber() const noexcept
Definition: common.hpp:87