DPC++ Runtime
Runtime libraries for oneAPI DPC++
pi_cuda.cpp
Go to the documentation of this file.
1 //==---------- pi_cuda.cpp - CUDA Plugin -----------------------------------==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
13 
14 #include <pi_cuda.hpp>
16 #include <sycl/detail/defines.hpp>
17 #include <sycl/detail/pi.hpp>
18 
19 // Forward declarations
20 void enableCUDATracing();
21 
22 //-- PI API implementation
23 extern "C" {
24 
26  pi_uint32 *NumPlatforms) {
27  return pi2ur::piPlatformsGet(NumEntries, Platforms, NumPlatforms);
28 }
29 
31  size_t ParamValueSize, void *ParamValue,
32  size_t *ParamValueSizeRet) {
33  return pi2ur::piPlatformGetInfo(Platform, ParamName, ParamValueSize,
34  ParamValue, ParamValueSizeRet);
35 }
36 
38  pi_native_handle *NativeHandle) {
39  return pi2ur::piextPlatformGetNativeHandle(Platform, NativeHandle);
40 }
41 
43  pi_platform *Platform) {
44  return pi2ur::piextPlatformCreateWithNativeHandle(NativeHandle, Platform);
45 }
46 
48  return pi2ur::piPluginGetLastError(message);
49 }
50 
52  const char *frontend_option,
53  const char **backend_option) {
54  return pi2ur::piPluginGetBackendOption(platform, frontend_option,
55  backend_option);
56 }
57 
59  pi_uint32 NumEntries, pi_device *Devices,
60  pi_uint32 *NumDevices) {
61  return pi2ur::piDevicesGet(Platform, DeviceType, NumEntries, Devices,
62  NumDevices);
63 }
64 
66  return pi2ur::piDeviceRetain(Device);
67 }
68 
70  return pi2ur::piDeviceRelease(Device);
71 }
72 
74  size_t ParamValueSize, void *ParamValue,
75  size_t *ParamValueSizeRet) {
76  return pi2ur::piDeviceGetInfo(Device, ParamName, ParamValueSize, ParamValue,
77  ParamValueSizeRet);
78 }
79 
81  const pi_device_partition_property *Properties,
82  pi_uint32 NumDevices, pi_device *OutDevices,
83  pi_uint32 *OutNumDevices) {
84  return pi2ur::piDevicePartition(Device, Properties, NumDevices, OutDevices,
85  OutNumDevices);
86 }
87 
89  pi_uint32 NumBinaries,
90  pi_uint32 *SelectedBinaryInd) {
91  return pi2ur::piextDeviceSelectBinary(Device, Binaries, NumBinaries,
92  SelectedBinaryInd);
93 }
94 
96  pi_native_handle *NativeHandle) {
97 
98  return pi2ur::piextDeviceGetNativeHandle(Device, NativeHandle);
99 }
100 
102  pi_platform Platform,
103  pi_device *Device) {
104 
105  return pi2ur::piextDeviceCreateWithNativeHandle(NativeHandle, Platform,
106  Device);
107 }
108 
110  pi_uint32 NumDevices, const pi_device *Devices,
111  void (*PFnNotify)(const char *ErrInfo,
112  const void *PrivateInfo, size_t CB,
113  void *UserData),
114  void *UserData, pi_context *RetContext) {
115  return pi2ur::piContextCreate(Properties, NumDevices, Devices, PFnNotify,
116  UserData, RetContext);
117 }
118 
120  size_t ParamValueSize, void *ParamValue,
121  size_t *ParamValueSizeRet) {
122 
123  return pi2ur::piContextGetInfo(Context, ParamName, ParamValueSize, ParamValue,
124  ParamValueSizeRet);
125 }
126 
129  void *UserData) {
130  return pi2ur::piextContextSetExtendedDeleter(Context, Function, UserData);
131 }
132 
134  pi_native_handle *NativeHandle) {
135  return pi2ur::piextContextGetNativeHandle(Context, NativeHandle);
136 }
137 
139  pi_uint32 NumDevices,
140  const pi_device *Devices,
141  bool OwnNativeHandle,
142  pi_context *RetContext) {
144  NativeHandle, NumDevices, Devices, OwnNativeHandle, RetContext);
145 }
146 
148 
149  return pi2ur::piContextRetain(Context);
150 }
151 
153  return pi2ur::piContextRelease(Context);
154 }
155 
157  pi_queue_properties Flags, pi_queue *Queue) {
158  pi_queue_properties Properties[] = {PI_QUEUE_FLAGS, Flags, 0};
159  return piextQueueCreate(Context, Device, Properties, Queue);
160 }
161 
163  pi_queue_properties *Properties, pi_queue *Queue) {
164  return pi2ur::piextQueueCreate(Context, Device, Properties, Queue);
165 }
166 
168  size_t ParamValueSize, void *ParamValue,
169  size_t *ParamValueSizeRet) {
170 
171  return pi2ur::piQueueGetInfo(Queue, ParamName, ParamValueSize, ParamValue,
172  ParamValueSizeRet);
173 }
174 
176 
178  return pi2ur::piQueueRelease(Queue);
179 }
180 
182 
184 
186  pi_native_handle *NativeHandle,
187  int32_t *NativeHandleDesc) {
188 
189  return pi2ur::piextQueueGetNativeHandle(Queue, NativeHandle,
190  NativeHandleDesc);
191 }
192 
194  int32_t NativeHandleDesc,
195  pi_context Context, pi_device Device,
196  bool OwnNativeHandle,
197  pi_queue_properties *Properties,
198  pi_queue *Queue) {
199 
201  NativeHandle, NativeHandleDesc, Context, Device, OwnNativeHandle,
202  Properties, Queue);
203 }
204 
206  void *HostPtr, pi_mem *RetMem,
207  const pi_mem_properties *properties) {
208  return pi2ur::piMemBufferCreate(Context, Flags, Size, HostPtr, RetMem,
209  properties);
210 }
211 
212 pi_result piMemGetInfo(pi_mem Mem, pi_mem_info ParamName, size_t ParamValueSize,
213  void *ParamValue, size_t *ParamValueSizeRet) {
214  return pi2ur::piMemGetInfo(Mem, ParamName, ParamValueSize, ParamValue,
215  ParamValueSizeRet);
216 }
217 
219 
221 
223  const pi_image_format *ImageFormat,
224  const pi_image_desc *ImageDesc, void *HostPtr,
225  pi_mem *RetImage) {
226 
227  return pi2ur::piMemImageCreate(Context, Flags, ImageFormat, ImageDesc,
228  HostPtr, RetImage);
229 }
230 
232  return pi2ur::piextMemGetNativeHandle(Mem, NativeHandle);
233 }
234 
236  pi_context Context,
237  bool ownNativeHandle, pi_mem *Mem) {
238  return pi2ur::piextMemCreateWithNativeHandle(NativeHandle, Context,
239  ownNativeHandle, Mem);
240 }
241 
242 pi_result piProgramCreate(pi_context Context, const void *ILBytes,
243  size_t Length, pi_program *Program) {
244  return pi2ur::piProgramCreate(Context, ILBytes, Length, Program);
245 }
246 
248  pi_context Context, pi_uint32 NumDevices, const pi_device *DeviceList,
249  const size_t *Lengths, const unsigned char **Binaries,
250  size_t NumMetadataEntries, const pi_device_binary_property *Metadata,
251  pi_int32 *BinaryStatus, pi_program *Program) {
252 
253  return pi2ur::piProgramCreateWithBinary(Context, NumDevices, DeviceList,
254  Lengths, Binaries, NumMetadataEntries,
255  Metadata, BinaryStatus, Program);
256 }
257 
259  pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle,
260  const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc,
261  pi_mem *Img) {
263  NativeHandle, Context, OwnNativeHandle, ImageFormat, ImageDesc, Img);
264 }
265 
267  size_t ParamValueSize, void *ParamValue,
268  size_t *ParamValueSizeRet) {
269 
270  return pi2ur::piProgramGetInfo(Program, ParamName, ParamValueSize, ParamValue,
271  ParamValueSizeRet);
272 }
273 
275  const pi_device *DeviceList, const char *Options,
276  pi_uint32 NumInputPrograms,
277  const pi_program *InputPrograms,
278  void (*PFnNotify)(pi_program Program, void *UserData),
279  void *UserData, pi_program *RetProgram) {
280  return pi2ur::piProgramLink(Context, NumDevices, DeviceList, Options,
281  NumInputPrograms, InputPrograms, PFnNotify,
282  UserData, RetProgram);
283 }
284 
286  pi_program Program, pi_uint32 NumDevices, const pi_device *DeviceList,
287  const char *Options, pi_uint32 NumInputHeaders,
288  const pi_program *InputHeaders, const char **HeaderIncludeNames,
289  void (*PFnNotify)(pi_program Program, void *UserData), void *UserData) {
290 
291  return pi2ur::piProgramCompile(Program, NumDevices, DeviceList, Options,
292  NumInputHeaders, InputHeaders,
293  HeaderIncludeNames, PFnNotify, UserData);
294 }
295 
297  const pi_device *DeviceList, const char *Options,
298  void (*PFnNotify)(pi_program Program, void *UserData),
299  void *UserData) {
300  return pi2ur::piProgramBuild(Program, NumDevices, DeviceList, Options,
301  PFnNotify, UserData);
302 }
303 
305  pi_program_build_info ParamName,
306  size_t ParamValueSize, void *ParamValue,
307  size_t *ParamValueSizeRet) {
308 
309  return pi2ur::piProgramGetBuildInfo(Program, Device, ParamName,
310  ParamValueSize, ParamValue,
311  ParamValueSizeRet);
312 }
313 
315  return pi2ur::piProgramRetain(Program);
316 }
317 
319  return pi2ur::piProgramRelease(Program);
320 }
321 
323  pi_native_handle *NativeHandle) {
324  return pi2ur::piextProgramGetNativeHandle(Program, NativeHandle);
325 }
326 
328  pi_context Context,
329  bool OwnNativeHandle,
330  pi_program *Program) {
331  return pi2ur::piextProgramCreateWithNativeHandle(NativeHandle, Context,
332  OwnNativeHandle, Program);
333 }
334 
335 pi_result piKernelCreate(pi_program Program, const char *KernelName,
336  pi_kernel *RetKernel) {
337 
338  return pi2ur::piKernelCreate(Program, KernelName, RetKernel);
339 }
340 
341 pi_result piKernelSetArg(pi_kernel Kernel, pi_uint32 ArgIndex, size_t ArgSize,
342  const void *ArgValue) {
343 
344  return pi2ur::piKernelSetArg(Kernel, ArgIndex, ArgSize, ArgValue);
345 }
346 
348  const pi_mem_obj_property *ArgProperties,
349  const pi_mem *ArgValue) {
350  return pi2ur::piextKernelSetArgMemObj(Kernel, ArgIndex, ArgProperties,
351  ArgValue);
352 }
353 
355  const pi_sampler *ArgValue) {
356 
357  return pi2ur::piextKernelSetArgSampler(Kernel, ArgIndex, ArgValue);
358 }
359 
361  size_t ParamValueSize, void *ParamValue,
362  size_t *ParamValueSizeRet) {
363 
364  return pi2ur::piKernelGetInfo(Kernel, ParamName, ParamValueSize, ParamValue,
365  ParamValueSizeRet);
366 }
367 
369  pi_device Device,
370  pi_image_format *ImageFormat,
371  pi_image_desc *ImageDesc,
372  pi_image_mem_handle *RetMem) {
373  return pi2ur::piextMemImageAllocate(Context, Device, ImageFormat, ImageDesc,
374  RetMem);
375 }
376 
378  pi_context Context, pi_device Device, pi_image_mem_handle ImgMem,
379  pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_mem *RetMem,
380  pi_image_handle *RetHandle) {
382  Context, Device, ImgMem, ImageFormat, ImageDesc, RetMem, RetHandle);
383 }
384 
386  pi_context Context, pi_device Device, pi_image_mem_handle ImgMem,
387  pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_sampler Sampler,
388  pi_mem *RetMem, pi_image_handle *RetHandle) {
389  return pi2ur::piextMemSampledImageCreate(Context, Device, ImgMem, ImageFormat,
390  ImageDesc, Sampler, RetMem,
391  RetHandle);
392 }
393 
395  pi_context Context, const pi_sampler_properties *SamplerProperties,
396  float MinMipmapLevelClamp, float MaxMipmapLevelClamp, float MaxAnisotropy,
397  pi_sampler *RetSampler) {
399  Context, SamplerProperties, MinMipmapLevelClamp, MaxMipmapLevelClamp,
400  MaxAnisotropy, RetSampler);
401 }
402 
404  pi_device Device,
405  pi_image_mem_handle MipMem,
406  unsigned int Level,
407  pi_image_mem_handle *RetMem) {
408  return pi2ur::piextMemMipmapGetLevel(Context, Device, MipMem, Level, RetMem);
409 }
410 
411 __SYCL_EXPORT pi_result piextMemImageFree(pi_context Context, pi_device Device,
412  pi_image_mem_handle MemoryHandle) {
413  return pi2ur::piextMemImageFree(Context, Device, MemoryHandle);
414 }
415 
416 __SYCL_EXPORT pi_result piextMemMipmapFree(pi_context Context, pi_device Device,
417  pi_image_mem_handle MemoryHandle) {
418  return pi2ur::piextMemMipmapFree(Context, Device, MemoryHandle);
419 }
420 
422  pi_queue Queue, void *DstPtr, void *SrcPtr,
423  const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc,
424  const pi_image_copy_flags Flags, pi_image_offset SrcOffset,
425  pi_image_offset DstOffset, pi_image_region CopyExtent,
426  pi_image_region HostExtent, pi_uint32 NumEventsInWaitList,
427  const pi_event *EventWaitList, pi_event *Event) {
428  return pi2ur::piextMemImageCopy(Queue, DstPtr, SrcPtr, ImageFormat, ImageDesc,
429  Flags, SrcOffset, DstOffset, CopyExtent,
430  HostExtent, NumEventsInWaitList,
431  EventWaitList, Event);
432 }
433 
435  pi_context Context, pi_device Device, pi_image_handle Handle) {
436  return pi2ur::piextMemUnsampledImageHandleDestroy(Context, Device, Handle);
437 }
438 
440  pi_context Context, pi_device Device, pi_image_handle Handle) {
441  return pi2ur::piextMemSampledImageHandleDestroy(Context, Device, Handle);
442 }
443 
445  pi_image_info ParamName,
446  void *ParamValue,
447  size_t *ParamValueSizeRet) {
448  return pi2ur::piextMemImageGetInfo(MemHandle, ParamName, ParamValue,
449  ParamValueSizeRet);
450 }
451 
452 __SYCL_EXPORT pi_result
453 piextMemImportOpaqueFD(pi_context Context, pi_device Device, size_t Size,
454  int FileDescriptor, pi_interop_mem_handle *RetHandle) {
455  return pi2ur::piextMemImportOpaqueFD(Context, Device, Size, FileDescriptor,
456  RetHandle);
457 }
458 
460  pi_context Context, pi_device Device, pi_image_format *ImageFormat,
461  pi_image_desc *ImageDesc, pi_interop_mem_handle MemHandle,
462  pi_image_mem_handle *RetMem) {
463  return pi2ur::piextMemMapExternalArray(Context, Device, ImageFormat,
464  ImageDesc, MemHandle, RetMem);
465 }
466 
468  pi_device Device,
469  pi_interop_mem_handle ExtMem) {
470  return pi2ur::piextMemReleaseInterop(Context, Device, ExtMem);
471 }
472 
474  pi_context Context, pi_device Device, int FileDescriptor,
475  pi_interop_semaphore_handle *RetHandle) {
476  return pi2ur::piextImportExternalSemaphoreOpaqueFD(Context, Device,
477  FileDescriptor, RetHandle);
478 }
479 
480 __SYCL_EXPORT pi_result
482  pi_interop_semaphore_handle SemHandle) {
483  return pi2ur::piextDestroyExternalSemaphore(Context, Device, SemHandle);
484 }
485 
487  pi_queue Queue, pi_interop_semaphore_handle SemHandle,
488  pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList,
489  pi_event *Event) {
491  Queue, SemHandle, NumEventsInWaitList, EventWaitList, Event);
492 }
493 
495  pi_queue Queue, pi_interop_semaphore_handle SemHandle,
496  pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList,
497  pi_event *Event) {
499  Queue, SemHandle, NumEventsInWaitList, EventWaitList, Event);
500 }
501 
503  pi_kernel_group_info ParamName,
504  size_t ParamValueSize, void *ParamValue,
505  size_t *ParamValueSizeRet) {
506  return pi2ur::piKernelGetGroupInfo(Kernel, Device, ParamName, ParamValueSize,
507  ParamValue, ParamValueSizeRet);
508 }
509 
511  pi_kernel_sub_group_info ParamName,
512  size_t InputValueSize, const void *InputValue,
513  size_t ParamValueSize, void *ParamValue,
514  size_t *ParamValueSizeRet) {
516  Kernel, Device, ParamName, InputValueSize, InputValue, ParamValueSize,
517  ParamValue, ParamValueSizeRet);
518 }
519 
521 
522  return pi2ur::piKernelRetain(Kernel);
523 }
524 
526 
527  return pi2ur::piKernelRelease(Kernel);
528 }
529 
530 pi_result
532  const size_t *GlobalWorkOffset,
533  const size_t *GlobalWorkSize, const size_t *LocalWorkSize,
534  pi_uint32 NumEventsInWaitList,
535  const pi_event *EventWaitList, pi_event *OutEvent) {
537  Queue, Kernel, WorkDim, GlobalWorkOffset, GlobalWorkSize, LocalWorkSize,
538  NumEventsInWaitList, EventWaitList, OutEvent);
539 }
540 
542  pi_context Context,
543  pi_program Program,
544  bool OwnNativeHandle,
545  pi_kernel *Kernel) {
546 
548  NativeHandle, Context, Program, OwnNativeHandle, Kernel);
549 }
550 
552  pi_native_handle *NativeHandle) {
553  return pi2ur::piextKernelGetNativeHandle(Kernel, NativeHandle);
554 }
555 
557  return pi2ur::piEventCreate(Context, RetEvent);
558 }
559 
561  size_t ParamValueSize, void *ParamValue,
562  size_t *ParamValueSizeRet) {
563  return pi2ur::piEventGetInfo(Event, ParamName, ParamValueSize, ParamValue,
564  ParamValueSizeRet);
565 }
566 
568  size_t ParamValueSize, void *ParamValue,
569  size_t *ParamValueSizeRet) {
570 
571  return pi2ur::piEventGetProfilingInfo(Event, ParamName, ParamValueSize,
572  ParamValue, ParamValueSizeRet);
573 }
574 
575 pi_result piEventsWait(pi_uint32 NumEvents, const pi_event *EventList) {
576  return pi2ur::piEventsWait(NumEvents, EventList);
577 }
578 
579 pi_result piEventSetCallback(pi_event Event, pi_int32 CommandExecCallbackType,
580  void (*PFnNotify)(pi_event Event,
581  pi_int32 EventCommandStatus,
582  void *UserData),
583  void *UserData) {
584  return pi2ur::piEventSetCallback(Event, CommandExecCallbackType, PFnNotify,
585  UserData);
586 }
587 
588 pi_result piEventSetStatus(pi_event Event, pi_int32 ExecutionStatus) {
589  return pi2ur::piEventSetStatus(Event, ExecutionStatus);
590 }
591 
593 
595  return pi2ur::piEventRelease(Event);
596 }
597 
599  pi_native_handle *NativeHandle) {
600 
601  return pi2ur::piextEventGetNativeHandle(Event, NativeHandle);
602 }
603 
605  pi_context Context,
606  bool OwnNativeHandle,
607  pi_event *Event) {
608  return pi2ur::piextEventCreateWithNativeHandle(NativeHandle, Context,
609  OwnNativeHandle, Event);
610 }
611 
613  const pi_sampler_properties *SamplerProperties,
614  pi_sampler *RetSampler) {
615  return pi2ur::piSamplerCreate(Context, SamplerProperties, RetSampler);
616 }
617 
619  size_t ParamValueSize, void *ParamValue,
620  size_t *ParamValueSizeRet) {
621 
622  return pi2ur::piSamplerGetInfo(Sampler, ParamName, ParamValueSize, ParamValue,
623  ParamValueSizeRet);
624 }
625 
627  return pi2ur::piSamplerRetain(Sampler);
628 }
629 
631  return pi2ur::piSamplerRelease(Sampler);
632 }
633 
634 pi_result piEnqueueEventsWait(pi_queue Queue, pi_uint32 NumEventsInWaitList,
635  const pi_event *EventWaitList,
636  pi_event *OutEvent) {
637 
638  return pi2ur::piEnqueueEventsWait(Queue, NumEventsInWaitList, EventWaitList,
639  OutEvent);
640 }
641 
643  pi_uint32 NumEventsInWaitList,
644  const pi_event *EventWaitList,
645  pi_event *OutEvent) {
646 
647  return pi2ur::piEnqueueEventsWaitWithBarrier(Queue, NumEventsInWaitList,
648  EventWaitList, OutEvent);
649 }
650 
652  pi_bool BlockingRead, size_t Offset,
653  size_t Size, void *Dst,
654  pi_uint32 NumEventsInWaitList,
655  const pi_event *EventWaitList,
656  pi_event *Event) {
657 
658  return pi2ur::piEnqueueMemBufferRead(Queue, Src, BlockingRead, Offset, Size,
659  Dst, NumEventsInWaitList, EventWaitList,
660  Event);
661 }
662 
664  pi_queue Queue, pi_mem Buffer, pi_bool BlockingRead,
665  pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset,
666  pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch,
667  size_t HostRowPitch, size_t HostSlicePitch, void *Ptr,
668  pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList,
669  pi_event *Event) {
670 
672  Queue, Buffer, BlockingRead, BufferOffset, HostOffset, Region,
673  BufferRowPitch, BufferSlicePitch, HostRowPitch, HostSlicePitch, Ptr,
674  NumEventsInWaitList, EventWaitList, Event);
675 }
676 
678  pi_bool BlockingWrite, size_t Offset,
679  size_t Size, const void *Ptr,
680  pi_uint32 NumEventsInWaitList,
681  const pi_event *EventWaitList,
682  pi_event *Event) {
683 
684  return pi2ur::piEnqueueMemBufferWrite(Queue, Buffer, BlockingWrite, Offset,
685  Size, Ptr, NumEventsInWaitList,
686  EventWaitList, Event);
687 }
688 
690  pi_queue Queue, pi_mem Buffer, pi_bool BlockingWrite,
691  pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset,
692  pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch,
693  size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr,
694  pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList,
695  pi_event *Event) {
696 
698  Queue, Buffer, BlockingWrite, BufferOffset, HostOffset, Region,
699  BufferRowPitch, BufferSlicePitch, HostRowPitch, HostSlicePitch, Ptr,
700  NumEventsInWaitList, EventWaitList, Event);
701 }
702 
704  size_t SrcOffset, size_t DstOffset,
705  size_t Size, pi_uint32 NumEventsInWaitList,
706  const pi_event *EventWaitList,
707  pi_event *Event) {
708 
709  return pi2ur::piEnqueueMemBufferCopy(Queue, SrcMem, DstMem, SrcOffset,
710  DstOffset, Size, NumEventsInWaitList,
711  EventWaitList, Event);
712 }
713 
715  pi_queue Queue, pi_mem SrcMem, pi_mem DstMem, pi_buff_rect_offset SrcOrigin,
716  pi_buff_rect_offset DstOrigin, pi_buff_rect_region Region,
717  size_t SrcRowPitch, size_t SrcSlicePitch, size_t DstRowPitch,
718  size_t DstSlicePitch, pi_uint32 NumEventsInWaitList,
719  const pi_event *EventWaitList, pi_event *Event) {
720 
722  Queue, SrcMem, DstMem, SrcOrigin, DstOrigin, Region, SrcRowPitch,
723  SrcSlicePitch, DstRowPitch, DstSlicePitch, NumEventsInWaitList,
724  EventWaitList, Event);
725 }
726 
728  const void *Pattern, size_t PatternSize,
729  size_t Offset, size_t Size,
730  pi_uint32 NumEventsInWaitList,
731  const pi_event *EventWaitList,
732  pi_event *Event) {
733 
734  return pi2ur::piEnqueueMemBufferFill(Queue, Buffer, Pattern, PatternSize,
735  Offset, Size, NumEventsInWaitList,
736  EventWaitList, Event);
737 }
738 
740  pi_map_flags MapFlags, size_t Offset,
741  size_t Size, pi_uint32 NumEventsInWaitList,
742  const pi_event *EventWaitList,
743  pi_event *OutEvent, void **RetMap) {
744 
745  return pi2ur::piEnqueueMemBufferMap(Queue, Mem, BlockingMap, MapFlags, Offset,
746  Size, NumEventsInWaitList, EventWaitList,
747  OutEvent, RetMap);
748 }
749 
750 pi_result piEnqueueMemUnmap(pi_queue Queue, pi_mem Mem, void *MappedPtr,
751  pi_uint32 NumEventsInWaitList,
752  const pi_event *EventWaitList, pi_event *OutEvent) {
753 
754  return pi2ur::piEnqueueMemUnmap(Queue, Mem, MappedPtr, NumEventsInWaitList,
755  EventWaitList, OutEvent);
756 }
757 
759  size_t ParamValueSize, void *ParamValue,
760  size_t *ParamValueSizeRet) {
761 
762  return pi2ur::piMemImageGetInfo(Image, ParamName, ParamValueSize, ParamValue,
763  ParamValueSizeRet);
764 }
765 
767  pi_bool BlockingRead, pi_image_offset Origin,
768  pi_image_region Region, size_t RowPitch,
769  size_t SlicePitch, void *Ptr,
770  pi_uint32 NumEventsInWaitList,
771  const pi_event *EventWaitList,
772  pi_event *Event) {
774  Queue, Image, BlockingRead, Origin, Region, RowPitch, SlicePitch, Ptr,
775  NumEventsInWaitList, EventWaitList, Event);
776 }
777 
779  pi_bool BlockingWrite, pi_image_offset Origin,
780  pi_image_region Region, size_t InputRowPitch,
781  size_t InputSlicePitch, const void *Ptr,
782  pi_uint32 NumEventsInWaitList,
783  const pi_event *EventWaitList,
784  pi_event *Event) {
785 
787  Queue, Image, BlockingWrite, Origin, Region, InputRowPitch,
788  InputSlicePitch, Ptr, NumEventsInWaitList, EventWaitList, Event);
789 }
790 
791 pi_result
792 piEnqueueMemImageCopy(pi_queue Queue, pi_mem SrcImage, pi_mem DstImage,
793  pi_image_offset SrcOrigin, pi_image_offset DstOrigin,
794  pi_image_region Region, pi_uint32 NumEventsInWaitList,
795  const pi_event *EventWaitList, pi_event *Event) {
796  return pi2ur::piEnqueueMemImageCopy(Queue, SrcImage, DstImage, SrcOrigin,
797  DstOrigin, Region, NumEventsInWaitList,
798  EventWaitList, Event);
799 }
800 
802  const void *FillColor, const size_t *Origin,
803  const size_t *Region,
804  pi_uint32 NumEventsInWaitList,
805  const pi_event *EventWaitList,
806  pi_event *Event) {
807 
808  return pi2ur::piEnqueueMemImageFill(Queue, Image, FillColor, Origin, Region,
809  NumEventsInWaitList, EventWaitList,
810  Event);
811 }
812 
814  pi_buffer_create_type BufferCreateType,
815  void *BufferCreateInfo, pi_mem *RetMem) {
816 
817  return pi2ur::piMemBufferPartition(Buffer, Flags, BufferCreateType,
818  BufferCreateInfo, RetMem);
819 }
820 
822  const char *FunctionName,
823  pi_uint64 *FunctionPointerRet) {
824  return pi2ur::piextGetDeviceFunctionPointer(Device, Program, FunctionName,
825  FunctionPointerRet);
826 }
827 
828 pi_result piextUSMDeviceAlloc(void **ResultPtr, pi_context Context,
829  pi_device Device,
830  pi_usm_mem_properties *Properties, size_t Size,
832 
833  return pi2ur::piextUSMDeviceAlloc(ResultPtr, Context, Device, Properties,
834  Size, Alignment);
835 }
836 
837 pi_result piextUSMSharedAlloc(void **ResultPtr, pi_context Context,
838  pi_device Device,
839  pi_usm_mem_properties *Properties, size_t Size,
841 
842  return pi2ur::piextUSMSharedAlloc(ResultPtr, Context, Device, Properties,
843  Size, Alignment);
844 }
845 
847  void **ResultPtr, size_t *ResultPitch, pi_context Context, pi_device Device,
848  pi_usm_mem_properties *Properties, size_t WidthInBytes, size_t Height,
849  unsigned int ElementSizeBytes) {
850 
851  return pi2ur::piextUSMPitchedAlloc(ResultPtr, ResultPitch, Context, Device,
852  Properties, WidthInBytes, Height,
853  ElementSizeBytes);
854 }
855 
856 pi_result piextUSMHostAlloc(void **ResultPtr, pi_context Context,
857  pi_usm_mem_properties *Properties, size_t Size,
859  return pi2ur::piextUSMHostAlloc(ResultPtr, Context, Properties, Size,
860  Alignment);
861 }
862 
863 pi_result piextUSMFree(pi_context Context, void *Ptr) {
864 
865  return pi2ur::piextUSMFree(Context, Ptr);
866 }
867 
869  size_t ArgSize, const void *ArgValue) {
870  return pi2ur::piextKernelSetArgPointer(Kernel, ArgIndex, ArgSize, ArgValue);
871 }
872 
874  size_t Count, pi_uint32 NumEventsInWaitlist,
875  const pi_event *EventsWaitlist,
876  pi_event *Event) {
878  Queue, Ptr, Value, Count, NumEventsInWaitlist, EventsWaitlist, Event);
879 }
880 
881 pi_result piextUSMEnqueueMemcpy(pi_queue Queue, pi_bool Blocking, void *DstPtr,
882  const void *SrcPtr, size_t Size,
883  pi_uint32 NumEventsInWaitlist,
884  const pi_event *EventsWaitlist,
885  pi_event *Event) {
886 
887  return pi2ur::piextUSMEnqueueMemcpy(Queue, Blocking, DstPtr, SrcPtr, Size,
888  NumEventsInWaitlist, EventsWaitlist,
889  Event);
890 }
891 
892 pi_result piextUSMEnqueuePrefetch(pi_queue Queue, const void *Ptr, size_t Size,
894  pi_uint32 NumEventsInWaitList,
895  const pi_event *EventWaitList,
896  pi_event *OutEvent) {
897 
899  Queue, Ptr, Size, Flags, NumEventsInWaitList, EventWaitList, OutEvent);
900 }
901 
903  size_t Length, pi_mem_advice Advice,
904  pi_event *OutEvent) {
905 
906  return pi2ur::piextUSMEnqueueMemAdvise(Queue, Ptr, Length, Advice, OutEvent);
907 }
908 
909 __SYCL_EXPORT pi_result piextUSMEnqueueFill2D(pi_queue Queue, void *Ptr,
910  size_t Pitch, size_t PatternSize,
911  const void *Pattern, size_t Width,
912  size_t Height,
913  pi_uint32 NumEventsWaitList,
914  const pi_event *EventsWaitList,
915  pi_event *Event) {
916 
917  return pi2ur::piextUSMEnqueueFill2D(Queue, Ptr, Pitch, PatternSize, Pattern,
918  Width, Height, NumEventsWaitList,
919  EventsWaitList, Event);
920 }
921 
922 __SYCL_EXPORT pi_result piextUSMEnqueueMemset2D(pi_queue Queue, void *Ptr,
923  size_t Pitch, int Value,
924  size_t Width, size_t Height,
925  pi_uint32 NumEventsWaitList,
926  const pi_event *EventsWaitlist,
927  pi_event *Event) {
928 
929  return pi2ur::piextUSMEnqueueMemset2D(Queue, Ptr, Pitch, Value, Width, Height,
930  NumEventsWaitList, EventsWaitlist,
931  Event);
932 }
933 
935  pi_queue Queue, pi_bool Blocking, void *DstPtr, size_t DstPitch,
936  const void *SrcPtr, size_t SrcPitch, size_t Width, size_t Height,
937  pi_uint32 NumEventsInWaitlist, const pi_event *EventWaitlist,
938  pi_event *Event) {
939 
941  Queue, Blocking, DstPtr, DstPitch, SrcPtr, SrcPitch, Width, Height,
942  NumEventsInWaitlist, EventWaitlist, Event);
943 }
944 
946  pi_mem_alloc_info ParamName,
947  size_t ParamValueSize, void *ParamValue,
948  size_t *ParamValueSizeRet) {
949  return pi2ur::piextUSMGetMemAllocInfo(Context, Ptr, ParamName, ParamValueSize,
950  ParamValue, ParamValueSizeRet);
951 }
952 
953 pi_result piextUSMImport(const void *HostPtr, size_t Size, pi_context Context) {
954  return pi2ur::piextUSMImport(HostPtr, Size, Context);
955 }
956 
957 pi_result piextUSMRelease(const void *HostPtr, pi_context Context) {
958  return pi2ur::piextUSMRelease(HostPtr, Context);
959 }
960 
962  pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingWrite,
963  size_t Count, size_t Offset, const void *Src, pi_uint32 NumEventsInWaitList,
964  const pi_event *EventsWaitList, pi_event *Event) {
966  Queue, Program, Name, BlockingWrite, Count, Offset, Src,
967  NumEventsInWaitList, EventsWaitList, Event);
968 }
969 
971  pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingRead,
972  size_t Count, size_t Offset, void *Dst, pi_uint32 NumEventsInWaitList,
973  const pi_event *EventsWaitList, pi_event *Event) {
975  Queue, Program, Name, BlockingRead, Count, Offset, Dst,
976  NumEventsInWaitList, EventsWaitList, Event);
977 
978  return PI_SUCCESS;
979 }
980 
982  const char *PipeSymbol, pi_bool Blocking,
983  void *Ptr, size_t Size,
984  pi_uint32 NumEventsInWaitList,
985  const pi_event *EventsWaitList,
986  pi_event *Event) {
987  (void)Queue;
988  (void)Program;
989  (void)PipeSymbol;
990  (void)Blocking;
991  (void)Ptr;
992  (void)Size;
993  (void)NumEventsInWaitList;
994  (void)EventsWaitList;
995  (void)Event;
996  PI_ASSERT(Queue, PI_ERROR_INVALID_QUEUE);
997  die("piextEnqueueReadHostPipe: not implemented");
998  return {};
999 }
1000 
1002  const char *PipeSymbol, pi_bool Blocking,
1003  void *Ptr, size_t Size,
1004  pi_uint32 NumEventsInWaitList,
1005  const pi_event *EventsWaitList,
1006  pi_event *Event) {
1007  (void)Queue;
1008  (void)Program;
1009  (void)PipeSymbol;
1010  (void)Blocking;
1011  (void)Ptr;
1012  (void)Size;
1013  (void)NumEventsInWaitList;
1014  (void)EventsWaitList;
1015  (void)Event;
1016  PI_ASSERT(Queue, PI_ERROR_INVALID_QUEUE);
1017  die("piextEnqueueWriteHostPipe: not implemented");
1018  return {};
1019 }
1020 
1022  size_t ParamValueSize, const void *ParamValue) {
1023 
1024  return pi2ur::piKernelSetExecInfo(Kernel, ParamName, ParamValueSize,
1025  ParamValue);
1026 }
1027 
1029  pi_uint32 SpecID, size_t Size,
1030  const void *SpecValue) {
1031  return pi2ur::piextProgramSetSpecializationConstant(Prog, SpecID, Size,
1032  SpecValue);
1033 }
1034 
1035 // Command buffer extension
1037  const pi_ext_command_buffer_desc *Desc,
1038  pi_ext_command_buffer *RetCommandBuffer) {
1039  return pi2ur::piextCommandBufferCreate(Context, Device, Desc,
1040  RetCommandBuffer);
1041 }
1042 
1044  return pi2ur::piextCommandBufferRetain(CommandBuffer);
1045 }
1046 
1048  return pi2ur::piextCommandBufferRelease(CommandBuffer);
1049 }
1050 
1052  return pi2ur::piextCommandBufferFinalize(CommandBuffer);
1053 }
1054 
1056  pi_ext_command_buffer CommandBuffer, pi_kernel Kernel, pi_uint32 WorkDim,
1057  const size_t *GlobalWorkOffset, const size_t *GlobalWorkSize,
1058  const size_t *LocalWorkSize, pi_uint32 NumSyncPointsInWaitList,
1059  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1061  CommandBuffer, Kernel, WorkDim, GlobalWorkOffset, GlobalWorkSize,
1062  LocalWorkSize, NumSyncPointsInWaitList, SyncPointWaitList, SyncPoint);
1063 }
1064 
1066  pi_ext_command_buffer CommandBuffer, void *DstPtr, const void *SrcPtr,
1067  size_t Size, pi_uint32 NumSyncPointsInWaitList,
1068  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1069  return pi2ur::piextCommandBufferMemcpyUSM(CommandBuffer, DstPtr, SrcPtr, Size,
1070  NumSyncPointsInWaitList,
1071  SyncPointWaitList, SyncPoint);
1072 }
1073 
1075  pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem,
1076  size_t SrcOffset, size_t DstOffset, size_t Size,
1077  pi_uint32 NumSyncPointsInWaitList,
1078  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1080  CommandBuffer, SrcMem, DstMem, SrcOffset, DstOffset, Size,
1081  NumSyncPointsInWaitList, SyncPointWaitList, SyncPoint);
1082 }
1083 
1085  pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem,
1086  pi_buff_rect_offset SrcOrigin, pi_buff_rect_offset DstOrigin,
1087  pi_buff_rect_region Region, size_t SrcRowPitch, size_t SrcSlicePitch,
1088  size_t DstRowPitch, size_t DstSlicePitch, pi_uint32 NumSyncPointsInWaitList,
1089  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1091  CommandBuffer, SrcMem, DstMem, SrcOrigin, DstOrigin, Region, SrcRowPitch,
1092  SrcSlicePitch, DstRowPitch, DstSlicePitch, NumSyncPointsInWaitList,
1093  SyncPointWaitList, SyncPoint);
1094 }
1095 
1097  pi_ext_command_buffer CommandBuffer, pi_mem Buffer, size_t Offset,
1098  size_t Size, void *Dst, pi_uint32 NumSyncPointsInWaitList,
1099  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1101  CommandBuffer, Buffer, Offset, Size, Dst, NumSyncPointsInWaitList,
1102  SyncPointWaitList, SyncPoint);
1103 }
1104 
1106  pi_ext_command_buffer CommandBuffer, pi_mem Buffer,
1107  pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset,
1108  pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch,
1109  size_t HostRowPitch, size_t HostSlicePitch, void *Ptr,
1110  pi_uint32 NumSyncPointsInWaitList,
1111  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1113  CommandBuffer, Buffer, BufferOffset, HostOffset, Region, BufferRowPitch,
1114  BufferSlicePitch, HostRowPitch, HostSlicePitch, Ptr,
1115  NumSyncPointsInWaitList, SyncPointWaitList, SyncPoint);
1116 }
1117 
1119  pi_ext_command_buffer CommandBuffer, pi_mem Buffer, size_t Offset,
1120  size_t Size, const void *Ptr, pi_uint32 NumSyncPointsInWaitList,
1121  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1123  CommandBuffer, Buffer, Offset, Size, Ptr, NumSyncPointsInWaitList,
1124  SyncPointWaitList, SyncPoint);
1125 }
1126 
1128  pi_ext_command_buffer CommandBuffer, pi_mem Buffer,
1129  pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset,
1130  pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch,
1131  size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr,
1132  pi_uint32 NumSyncPointsInWaitList,
1133  const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint) {
1135  CommandBuffer, Buffer, BufferOffset, HostOffset, Region, BufferRowPitch,
1136  BufferSlicePitch, HostRowPitch, HostSlicePitch, Ptr,
1137  NumSyncPointsInWaitList, SyncPointWaitList, SyncPoint);
1138 }
1139 
1141  pi_queue Queue,
1142  pi_uint32 NumEventsInWaitList,
1143  const pi_event *EventWaitList,
1144  pi_event *Event) {
1146  CommandBuffer, Queue, NumEventsInWaitList, EventWaitList, Event);
1147 }
1148 
1149 pi_result piextPluginGetOpaqueData(void *opaque_data_param,
1150  void **opaque_data_return) {
1151  return pi2ur::piextPluginGetOpaqueData(opaque_data_param, opaque_data_return);
1152 }
1153 
1154 pi_result piTearDown(void *PluginParameter) {
1155  return pi2ur::piTearDown(PluginParameter);
1156 }
1157 
1158 pi_result piGetDeviceAndHostTimer(pi_device Device, uint64_t *DeviceTime,
1159  uint64_t *HostTime) {
1160  return pi2ur::piGetDeviceAndHostTimer(Device, DeviceTime, HostTime);
1161 }
1162 
1164  pi_device peer_device) {
1165 
1166  return pi2ur::piextEnablePeerAccess(command_device, peer_device);
1167 }
1168 
1170  pi_device peer_device) {
1171 
1172  return pi2ur::piextDisablePeerAccess(command_device, peer_device);
1173 }
1174 
1176  pi_device peer_device, pi_peer_attr attr,
1177  size_t ParamValueSize, void *ParamValue,
1178  size_t *ParamValueSizeRet) {
1179  return pi2ur::piextPeerAccessGetInfo(command_device, peer_device, attr,
1180  ParamValueSize, ParamValue,
1181  ParamValueSizeRet);
1182 }
1183 
1185 
1187  // Check that the major version matches in PiVersion and SupportedVersion
1189 
1190  // PI interface supports higher version or the same version.
1191  size_t PluginVersionSize = sizeof(PluginInit->PluginVersion);
1192  if (strlen(SupportedVersion) >= PluginVersionSize)
1193  return PI_ERROR_INVALID_VALUE;
1194  strncpy(PluginInit->PluginVersion, SupportedVersion, PluginVersionSize);
1195 
1196  // Set whole function table to zero to make it easier to detect if
1197  // functions are not set up below.
1198  std::memset(&(PluginInit->PiFunctionTable), 0,
1199  sizeof(PluginInit->PiFunctionTable));
1200 
1202 
1203 // Forward calls to CUDA RT.
1204 #define _PI_API(api) \
1205  (PluginInit->PiFunctionTable).api = (decltype(&::api))(&api);
1206 #include <sycl/detail/pi.def>
1207 #undef _PI_API
1208 
1209  return PI_SUCCESS;
1210 }
1211 
1212 #ifdef _WIN32
1213 #define __SYCL_PLUGIN_DLL_NAME "pi_cuda.dll"
1214 #include "../common_win_pi_trace/common_win_pi_trace.hpp"
1215 #undef __SYCL_PLUGIN_DLL_NAME
1216 #endif
1217 
1218 } // extern "C"
pi2ur::piextUSMPitchedAlloc
pi_result piextUSMPitchedAlloc(void **ResultPtr, size_t *ResultPitch, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t WidthInBytes, size_t Height, unsigned int ElementSizeBytes)
Allocates memory accessible on device.
Definition: pi2ur.hpp:3127
piextProgramGetNativeHandle
pi_result piextProgramGetNativeHandle(pi_program Program, pi_native_handle *NativeHandle)
Gets the native handle of a PI program object.
Definition: pi_cuda.cpp:322
piSamplerRelease
pi_result piSamplerRelease(pi_sampler Sampler)
Definition: pi_cuda.cpp:630
piextGetDeviceFunctionPointer
pi_result piextGetDeviceFunctionPointer(pi_device Device, pi_program Program, const char *FunctionName, pi_uint64 *FunctionPointerRet)
Retrieves a device function pointer to a user-defined function.
Definition: pi_cuda.cpp:821
pi2ur::piextCommandBufferMemBufferWriteRect
pi_result piextCommandBufferMemBufferWriteRect(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer write command to the command-buffer.
Definition: pi2ur.hpp:4453
piextCommandBufferMemBufferWriteRect
pi_result piextCommandBufferMemBufferWriteRect(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer write command to the command-buffer.
Definition: pi_cuda.cpp:1127
piextUSMEnqueueMemcpy
pi_result piextUSMEnqueueMemcpy(pi_queue Queue, pi_bool Blocking, void *DstPtr, const void *SrcPtr, size_t Size, pi_uint32 NumEventsInWaitlist, const pi_event *EventsWaitlist, pi_event *Event)
USM Memcpy API.
Definition: pi_cuda.cpp:881
_pi_mem
Definition: pi_cuda.hpp:56
pi2ur::piKernelSetArg
pi_result piKernelSetArg(pi_kernel Kernel, pi_uint32 ArgIndex, size_t ArgSize, const void *ArgValue)
Definition: pi2ur.hpp:2189
piextCommandBufferRetain
pi_result piextCommandBufferRetain(pi_ext_command_buffer CommandBuffer)
API to increment the reference count of the command-buffer.
Definition: pi_cuda.cpp:1043
pi2ur::piextSignalExternalSemaphore
pi_result piextSignalExternalSemaphore(pi_queue Queue, pi_interop_semaphore_handle SemHandle, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to instruct the queue to signal the external semaphore handle once all previous commands have com...
Definition: pi2ur.hpp:5059
pi2ur::piEventGetProfilingInfo
pi_result piEventGetProfilingInfo(pi_event Event, pi_profiling_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:4023
pi2ur::piKernelGetGroupInfo
pi_result piKernelGetGroupInfo(pi_kernel Kernel, pi_device Device, pi_kernel_group_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:2372
piEnqueueKernelLaunch
pi_result piEnqueueKernelLaunch(pi_queue Queue, pi_kernel Kernel, pi_uint32 WorkDim, const size_t *GlobalWorkOffset, const size_t *GlobalWorkSize, const size_t *LocalWorkSize, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent)
Definition: pi_cuda.cpp:531
piextPlatformCreateWithNativeHandle
pi_result piextPlatformCreateWithNativeHandle(pi_native_handle NativeHandle, pi_platform *Platform)
Creates PI platform object from a native handle.
Definition: pi_cuda.cpp:42
piextUSMImport
pi_result piextUSMImport(const void *HostPtr, size_t Size, pi_context Context)
Import host system memory into USM.
Definition: pi_cuda.cpp:953
piextEnqueueReadHostPipe
pi_result piextEnqueueReadHostPipe(pi_queue Queue, pi_program Program, const char *PipeSymbol, pi_bool Blocking, void *Ptr, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *Event)
Plugin.
Definition: pi_cuda.cpp:981
_pi_context_info
_pi_context_info
Definition: pi.h:448
pi_buff_rect_offset_struct
Definition: pi.h:1016
piEnqueueEventsWaitWithBarrier
pi_result piEnqueueEventsWaitWithBarrier(pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent)
Definition: pi_cuda.cpp:642
pi2ur::piKernelRelease
pi_result piKernelRelease(pi_kernel Kernel)
Definition: pi2ur.hpp:2439
piMemImageCreate
pi_result piMemImageCreate(pi_context Context, pi_mem_flags Flags, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, void *HostPtr, pi_mem *RetImage)
Definition: pi_cuda.cpp:222
piDeviceRetain
pi_result piDeviceRetain(pi_device Device)
Definition: pi_cuda.cpp:65
pi2ur::piPlatformGetInfo
pi_result piPlatformGetInfo(pi_platform Platform, pi_platform_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:854
pi2ur::piProgramRetain
pi_result piProgramRetain(pi_program Program)
Definition: pi2ur.hpp:2238
piProgramRelease
pi_result piProgramRelease(pi_program Program)
Definition: pi_cuda.cpp:318
piEventRelease
pi_result piEventRelease(pi_event Event)
Definition: pi_cuda.cpp:594
pi_bool
pi_uint32 pi_bool
Definition: pi.h:196
pi2ur::piEventRetain
pi_result piEventRetain(pi_event Event)
Definition: pi2ur.hpp:4120
pi2ur::piextUSMGetMemAllocInfo
pi_result piextUSMGetMemAllocInfo(pi_context Context, const void *Ptr, pi_mem_alloc_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
API to query information about USM allocated pointers Valid Queries: PI_MEM_ALLOC_TYPE returns host/d...
Definition: pi2ur.hpp:3351
piextUSMEnqueueMemset
pi_result piextUSMEnqueueMemset(pi_queue Queue, void *Ptr, pi_int32 Value, size_t Count, pi_uint32 NumEventsInWaitlist, const pi_event *EventsWaitlist, pi_event *Event)
USM Memset API.
Definition: pi_cuda.cpp:873
pi2ur::piextCommandBufferMemcpyUSM
pi_result piextCommandBufferMemcpyUSM(pi_ext_command_buffer CommandBuffer, void *DstPtr, const void *SrcPtr, size_t Size, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a USM memcpy command to the command-buffer.
Definition: pi2ur.hpp:4345
piextMemReleaseInterop
pi_result piextMemReleaseInterop(pi_context Context, pi_device Device, pi_interop_mem_handle ExtMem)
API to destroy interop memory.
Definition: pi_cuda.cpp:467
piextCommandBufferFinalize
pi_result piextCommandBufferFinalize(pi_ext_command_buffer CommandBuffer)
API to stop command-buffer recording such that no more commands can be appended, and makes the comman...
Definition: pi_cuda.cpp:1051
pi2ur::piextCommandBufferMemBufferCopyRect
pi_result piextCommandBufferMemBufferCopyRect(pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem, pi_buff_rect_offset SrcOrigin, pi_buff_rect_offset DstOrigin, pi_buff_rect_region Region, size_t SrcRowPitch, size_t SrcSlicePitch, size_t DstRowPitch, size_t DstSlicePitch, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer copy command to the command-buffer.
Definition: pi2ur.hpp:4377
piEnqueueMemImageFill
pi_result piEnqueueMemImageFill(pi_queue Queue, pi_mem Image, const void *FillColor, const size_t *Origin, const size_t *Region, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:801
piMemRelease
pi_result piMemRelease(pi_mem Mem)
Definition: pi_cuda.cpp:220
pi2ur::piextPlatformCreateWithNativeHandle
pi_result piextPlatformCreateWithNativeHandle(pi_native_handle NativeHandle, pi_platform *Platform)
Creates PI platform object from a native handle.
Definition: pi2ur.hpp:837
pi2ur::piextMemImageCreateWithNativeHandle
pi_result piextMemImageCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, pi_mem *RetImage)
Creates PI image object from a native handle.
Definition: pi2ur.hpp:2966
piextProgramSetSpecializationConstant
pi_result piextProgramSetSpecializationConstant(pi_program Prog, pi_uint32 SpecID, size_t Size, const void *SpecValue)
Sets a specialization constant to a specific value.
Definition: pi_cuda.cpp:1028
pi2ur::piEnqueueMemBufferMap
pi_result piEnqueueMemBufferMap(pi_queue Queue, pi_mem Mem, pi_bool BlockingMap, pi_map_flags MapFlags, size_t Offset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent, void **RetMap)
Definition: pi2ur.hpp:3588
pi2ur::piextProgramGetNativeHandle
pi_result piextProgramGetNativeHandle(pi_program Program, pi_native_handle *NativeHandle)
Gets the native handle of a PI program object.
Definition: pi2ur.hpp:2294
pi2ur::piSamplerCreate
pi_result piSamplerCreate(pi_context Context, const pi_sampler_properties *SamplerProperties, pi_sampler *RetSampler)
Definition: pi2ur.hpp:4143
enableCUDATracing
void enableCUDATracing()
Definition: tracing.cpp:70
piextKernelSetArgSampler
pi_result piextKernelSetArgSampler(pi_kernel Kernel, pi_uint32 ArgIndex, const pi_sampler *ArgValue)
Definition: pi_cuda.cpp:354
_pi_plugin
Definition: pi.h:2694
piEnqueueEventsWait
pi_result piEnqueueEventsWait(pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent)
Definition: pi_cuda.cpp:634
pi2ur::piextDeviceGetNativeHandle
pi_result piextDeviceGetNativeHandle(pi_device Device, pi_native_handle *NativeHandle)
Gets the native handle of a PI device object.
Definition: pi2ur.hpp:1282
pi2ur::piEventsWait
pi_result piEventsWait(pi_uint32 NumEvents, const pi_event *EventsWaitList)
Definition: pi2ur.hpp:3965
_pi_image_copy_flags
_pi_image_copy_flags
Definition: pi.h:619
piPluginGetLastError
pi_result piPluginGetLastError(char **message)
API to get Plugin specific warning and error messages.
Definition: pi_cuda.cpp:47
pi2ur::piextEventCreateWithNativeHandle
pi_result piextEventCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, pi_event *Event)
Creates PI event object from a native handle.
Definition: pi2ur.hpp:4076
pi2ur::piProgramCreate
pi_result piProgramCreate(pi_context Context, const void *ILBytes, size_t Length, pi_program *Program)
Definition: pi2ur.hpp:1836
_pi_mem_advice
_pi_mem_advice
Definition: pi.h:567
pi2ur::piextEventGetNativeHandle
pi_result piextEventGetNativeHandle(pi_event Event, pi_native_handle *NativeHandle)
Gets the native handle of a PI event object.
Definition: pi2ur.hpp:4008
piextEnqueueWriteHostPipe
pi_result piextEnqueueWriteHostPipe(pi_queue Queue, pi_program Program, const char *PipeSymbol, pi_bool Blocking, void *Ptr, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *Event)
Write to pipe of a given name.
Definition: pi_cuda.cpp:1001
pi2ur::piextCommandBufferMemBufferRead
pi_result piextCommandBufferMemBufferRead(pi_ext_command_buffer CommandBuffer, pi_mem Src, size_t Offset, size_t Size, void *Dst, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer read command to the command-buffer.
Definition: pi2ur.hpp:4436
pi2ur::piextMemMapExternalArray
pi_result piextMemMapExternalArray(pi_context Context, pi_device Device, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_interop_mem_handle MemHandle, pi_image_mem_handle *RetMem)
API to map an interop memory handle to an image memory handle.
Definition: pi2ur.hpp:4955
piextPeerAccessGetInfo
pi_result piextPeerAccessGetInfo(pi_device command_device, pi_device peer_device, pi_peer_attr attr, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:1175
piextUSMRelease
pi_result piextUSMRelease(const void *HostPtr, pi_context Context)
Release host system memory from USM.
Definition: pi_cuda.cpp:957
pi2ur::piGetDeviceAndHostTimer
pi_result piGetDeviceAndHostTimer(pi_device Device, uint64_t *DeviceTime, uint64_t *HostTime)
Queries device for it's global timestamp in nanoseconds, and updates HostTime with the value of the h...
Definition: pi2ur.hpp:1390
syclcompat::detail::memset
static sycl::event memset(sycl::queue q, void *dev_ptr, int value, size_t size)
Set value to the first size bytes starting from dev_ptr in q.
Definition: memory.hpp:202
piMemImageGetInfo
pi_result piMemImageGetInfo(pi_mem Image, pi_image_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:758
_pi_plugin::PluginVersion
char PluginVersion[20]
Definition: pi.h:2704
_pi_result
_pi_result
Definition: pi.h:205
pi_context_properties
intptr_t pi_context_properties
Definition: pi.h:654
pi2ur::piEventSetStatus
pi_result piEventSetStatus(pi_event Event, pi_int32 ExecutionStatus)
Definition: pi2ur.hpp:4113
pi2ur::piPlatformsGet
pi_result piPlatformsGet(pi_uint32 NumEntries, pi_platform *Platforms, pi_uint32 *NumPlatforms)
Definition: pi2ur.hpp:800
piContextRelease
pi_result piContextRelease(pi_context Context)
Definition: pi_cuda.cpp:152
_pi_device_type
_pi_device_type
Definition: pi.h:253
cuda_definitions.hpp
piEnqueueMemBufferReadRect
pi_result piEnqueueMemBufferReadRect(pi_queue Queue, pi_mem Buffer, pi_bool BlockingRead, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:663
pi2ur::piProgramRelease
pi_result piProgramRelease(pi_program Program)
Definition: pi2ur.hpp:2450
pi2ur::piextUSMEnqueueMemset2D
pi_result piextUSMEnqueueMemset2D(pi_queue Queue, void *Ptr, size_t Pitch, int Value, size_t Width, size_t Height, pi_uint32 NumEventsWaitList, const pi_event *EventsWaitList, pi_event *Event)
USM 2D Memset API.
Definition: pi2ur.hpp:3332
pi2ur::piextDisablePeerAccess
pi_result piextDisablePeerAccess(pi_device command_device, pi_device peer_device)
Definition: pi2ur.hpp:4538
pi2ur::piextWaitExternalSemaphore
pi_result piextWaitExternalSemaphore(pi_queue Queue, pi_interop_semaphore_handle SemHandle, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to instruct the queue with a non-blocking wait on an external semaphore.
Definition: pi2ur.hpp:5039
piextKernelCreateWithNativeHandle
pi_result piextKernelCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, pi_program Program, bool OwnNativeHandle, pi_kernel *Kernel)
Creates PI kernel object from a native handle.
Definition: pi_cuda.cpp:541
_pi_platform
Definition: pi_cuda.hpp:44
pi2ur::piMemImageGetInfo
pi_result piMemImageGetInfo(pi_mem Image, pi_image_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:3416
pi2ur::piProgramLink
pi_result piProgramLink(pi_context Context, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, pi_uint32 NumInputPrograms, const pi_program *InputPrograms, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData, pi_program *RetProgram)
Definition: pi2ur.hpp:1966
pi_ext_command_buffer_desc
Definition: pi.h:2266
piPluginGetBackendOption
pi_result piPluginGetBackendOption(pi_platform platform, const char *frontend_option, const char **backend_option)
API to get backend specific option.
Definition: pi_cuda.cpp:51
pi2ur::piKernelCreate
pi_result piKernelCreate(pi_program Program, const char *KernelName, pi_kernel *RetKernel)
Definition: pi2ur.hpp:2077
pi2ur::piEventCreate
pi_result piEventCreate(pi_context Context, pi_event *RetEvent)
Create PI event object in a signalled/completed state.
Definition: pi2ur.hpp:4061
pi2ur::piEnqueueMemImageCopy
pi_result piEnqueueMemImageCopy(pi_queue Queue, pi_mem SrcImage, pi_mem DstImage, pi_image_offset SrcOrigin, pi_image_offset DstOrigin, pi_image_region Region, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3056
pi2ur::piextKernelCreateWithNativeHandle
pi_result piextKernelCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, pi_program Program, bool OwnNativeHandle, pi_kernel *Kernel)
Creates PI kernel object from a native handle.
Definition: pi2ur.hpp:2215
piextDisablePeerAccess
pi_result piextDisablePeerAccess(pi_device command_device, pi_device peer_device)
Definition: pi_cuda.cpp:1169
piextMemCreateWithNativeHandle
pi_result piextMemCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool ownNativeHandle, pi_mem *Mem)
Creates PI mem object from a native handle.
Definition: pi_cuda.cpp:235
pi.hpp
pi2ur::piextUSMEnqueueMemcpy2D
pi_result piextUSMEnqueueMemcpy2D(pi_queue Queue, pi_bool Blocking, void *DstPtr, size_t DstPitch, const void *SrcPtr, size_t SrcPitch, size_t Width, size_t Height, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
USM 2D Memcpy API.
Definition: pi2ur.hpp:3475
_pi_device_info
_pi_device_info
Definition: pi.h:285
piextUSMEnqueueMemset2D
pi_result piextUSMEnqueueMemset2D(pi_queue Queue, void *Ptr, size_t Pitch, int Value, size_t Width, size_t Height, pi_uint32 NumEventsWaitList, const pi_event *EventsWaitlist, pi_event *Event)
USM 2D Memset API.
Definition: pi_cuda.cpp:922
piextUSMEnqueueMemAdvise
pi_result piextUSMEnqueueMemAdvise(pi_queue Queue, const void *Ptr, size_t Length, pi_mem_advice Advice, pi_event *OutEvent)
USM Memadvise API.
Definition: pi_cuda.cpp:902
_pi_image_info
_pi_image_info
Definition: pi.h:497
pi2ur::piextMemSampledImageCreate
pi_result piextMemSampledImageCreate(pi_context Context, pi_device Device, pi_image_mem_handle ImgMem, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_sampler Sampler, pi_mem *RetMem, pi_image_handle *RetHandle)
API to create sampled bindless image handles.
Definition: pi2ur.hpp:4633
pi2ur::piextEnqueueDeviceGlobalVariableRead
pi_result piextEnqueueDeviceGlobalVariableRead(pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingRead, size_t Count, size_t Offset, void *Dst, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
API reading data from a device global variable to host.
Definition: pi2ur.hpp:2607
piextSignalExternalSemaphore
pi_result piextSignalExternalSemaphore(pi_queue Queue, pi_interop_semaphore_handle SemHandle, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to instruct the queue to signal the external semaphore handle once all previous commands have com...
Definition: pi_cuda.cpp:494
pi2ur::piDevicesGet
pi_result piDevicesGet(pi_platform Platform, pi_device_type DeviceType, pi_uint32 NumEntries, pi_device *Devices, pi_uint32 *NumDevices)
Definition: pi2ur.hpp:930
piextMemGetNativeHandle
pi_result piextMemGetNativeHandle(pi_mem Mem, pi_native_handle *NativeHandle)
Gets the native handle of a PI mem object.
Definition: pi_cuda.cpp:231
pi2ur::piTearDown
pi_result piTearDown(void *PluginParameter)
API to notify that the plugin should clean up its resources.
Definition: pi2ur.hpp:772
_pi_kernel
Definition: pi_cuda.hpp:72
pi2ur::piQueueFinish
pi_result piQueueFinish(pi_queue Queue)
Definition: pi2ur.hpp:1747
pi2ur::piEnqueueMemBufferWriteRect
pi_result piEnqueueMemBufferWriteRect(pi_queue Queue, pi_mem Buffer, pi_bool BlockingWrite, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3768
pi2ur::piextCommandBufferMemBufferWrite
pi_result piextCommandBufferMemBufferWrite(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, size_t Offset, size_t Size, const void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer write command to the command-buffer.
Definition: pi2ur.hpp:4484
piextUSMPitchedAlloc
pi_result piextUSMPitchedAlloc(void **ResultPtr, size_t *ResultPitch, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t WidthInBytes, size_t Height, unsigned int ElementSizeBytes)
Allocates memory accessible on device.
Definition: pi_cuda.cpp:846
piextEnqueueDeviceGlobalVariableRead
pi_result piextEnqueueDeviceGlobalVariableRead(pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingRead, size_t Count, size_t Offset, void *Dst, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *Event)
API reading data from a device global variable to host.
Definition: pi_cuda.cpp:970
pi2ur::piextMemImageFree
pi_result piextMemImageFree(pi_context Context, pi_device Device, pi_image_mem_handle MemoryHandle)
API to free memory for bindless images.
Definition: pi2ur.hpp:4759
piSamplerRetain
pi_result piSamplerRetain(pi_sampler Sampler)
Definition: pi_cuda.cpp:626
_pi_plugin::PiVersion
char PiVersion[20]
Definition: pi.h:2702
pi2ur::piextMemImportOpaqueFD
pi_result piextMemImportOpaqueFD(pi_context Context, pi_device Device, size_t Size, int FileDescriptor, pi_interop_mem_handle *RetHandle)
API to import external memory in the form of a file descriptor.
Definition: pi2ur.hpp:4930
piextMemImageGetInfo
pi_result piextMemImageGetInfo(pi_image_mem_handle MemHandle, pi_image_info ParamName, void *ParamValue, size_t *ParamValueSizeRet)
API to query an image memory handle for specific properties.
Definition: pi_cuda.cpp:444
_pi_ext_command_buffer
Definition: pi_cuda.hpp:80
pi2ur::piextKernelGetNativeHandle
pi_result piextKernelGetNativeHandle(pi_kernel Kernel, pi_native_handle *NativeHandle)
Gets the native handle of a PI kernel object.
Definition: pi2ur.hpp:2548
piEnqueueMemBufferWrite
pi_result piEnqueueMemBufferWrite(pi_queue Queue, pi_mem Buffer, pi_bool BlockingWrite, size_t Offset, size_t Size, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:677
piProgramRetain
pi_result piProgramRetain(pi_program Program)
Definition: pi_cuda.cpp:314
_pi_queue_info
_pi_queue_info
Definition: pi.h:465
pi2ur::piEnqueueMemImageFill
pi_result piEnqueueMemImageFill(pi_queue Queue, pi_mem Image, const void *FillColor, const size_t *Origin, const size_t *Region, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *Event)
Definition: pi2ur.hpp:2094
pi2ur::piQueueRetain
pi_result piQueueRetain(pi_queue Queue)
Definition: pi2ur.hpp:1808
piProgramLink
pi_result piProgramLink(pi_context Context, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, pi_uint32 NumInputPrograms, const pi_program *InputPrograms, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData, pi_program *RetProgram)
Definition: pi_cuda.cpp:274
_pi_buffer_create_type
_pi_buffer_create_type
Definition: pi.h:625
pi2ur::piextProgramSetSpecializationConstant
pi_result piextProgramSetSpecializationConstant(pi_program Program, pi_uint32 SpecID, size_t Size, const void *SpecValue)
Sets a specialization constant to a specific value.
Definition: pi2ur.hpp:2060
pi2ur::piDevicePartition
pi_result piDevicePartition(pi_device Device, const pi_device_partition_property *Properties, pi_uint32 NumEntries, pi_device *SubDevices, pi_uint32 *NumSubDevices)
Definition: pi2ur.hpp:1314
pi2ur::piextUSMHostAlloc
pi_result piextUSMHostAlloc(void **ResultPtr, pi_context Context, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates host memory accessible by the device.
Definition: pi2ur.hpp:2675
piEnqueueMemBufferCopy
pi_result piEnqueueMemBufferCopy(pi_queue Queue, pi_mem SrcMem, pi_mem DstMem, size_t SrcOffset, size_t DstOffset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:703
SupportedVersion
const char SupportedVersion[]
Definition: pi_cuda.cpp:1184
pi2ur::piEnqueueMemImageWrite
pi_result piEnqueueMemImageWrite(pi_queue Queue, pi_mem Image, pi_bool BlockingWrite, pi_image_offset Origin, pi_image_region Region, size_t InputRowPitch, size_t InputSlicePitch, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3533
piextMemImageCreateWithNativeHandle
pi_result piextMemImageCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, pi_mem *Img)
Creates PI image object from a native handle.
Definition: pi_cuda.cpp:258
pi2ur::piextCommandBufferRelease
pi_result piextCommandBufferRelease(pi_ext_command_buffer CommandBuffer)
API to decrement the reference count of the command-buffer.
Definition: pi2ur.hpp:4309
piEnqueueMemImageCopy
pi_result piEnqueueMemImageCopy(pi_queue Queue, pi_mem SrcImage, pi_mem DstImage, pi_image_offset SrcOrigin, pi_image_offset DstOrigin, pi_image_region Region, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:792
piDevicePartition
pi_result piDevicePartition(pi_device Device, const pi_device_partition_property *Properties, pi_uint32 NumDevices, pi_device *OutDevices, pi_uint32 *OutNumDevices)
Definition: pi_cuda.cpp:80
piextImportExternalSemaphoreOpaqueFD
pi_result piextImportExternalSemaphoreOpaqueFD(pi_context Context, pi_device Device, int FileDescriptor, pi_interop_semaphore_handle *RetHandle)
API to import an external semaphore in the form of a file descriptor.
Definition: pi_cuda.cpp:473
piKernelCreate
pi_result piKernelCreate(pi_program Program, const char *KernelName, pi_kernel *RetKernel)
Definition: pi_cuda.cpp:335
piextKernelSetArgPointer
pi_result piextKernelSetArgPointer(pi_kernel Kernel, pi_uint32 ArgIndex, size_t ArgSize, const void *ArgValue)
Sets up pointer arguments for CL kernels.
Definition: pi_cuda.cpp:868
piextMemSampledImageHandleDestroy
pi_result piextMemSampledImageHandleDestroy(pi_context Context, pi_device Device, pi_image_handle Handle)
API to destroy bindless sampled image handles.
Definition: pi_cuda.cpp:439
pi2ur::piSamplerGetInfo
pi_result piSamplerGetInfo(pi_sampler Sampler, pi_sampler_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:4204
pi2ur::piEnqueueMemBufferCopy
pi_result piEnqueueMemBufferCopy(pi_queue Queue, pi_mem SrcMem, pi_mem DstMem, size_t SrcOffset, size_t DstOffset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3723
piextMemMapExternalArray
pi_result piextMemMapExternalArray(pi_context Context, pi_device Device, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_interop_mem_handle MemHandle, pi_image_mem_handle *RetMem)
API to map an interop memory handle to an image memory handle.
Definition: pi_cuda.cpp:459
_pi_queue
Definition: pi_cuda.hpp:60
piEnqueueMemBufferCopyRect
pi_result piEnqueueMemBufferCopyRect(pi_queue Queue, pi_mem SrcMem, pi_mem DstMem, pi_buff_rect_offset SrcOrigin, pi_buff_rect_offset DstOrigin, pi_buff_rect_region Region, size_t SrcRowPitch, size_t SrcSlicePitch, size_t DstRowPitch, size_t DstSlicePitch, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:714
pi_uint32
uint32_t pi_uint32
Definition: pi.h:194
pi2ur::piContextGetInfo
pi_result piContextGetInfo(pi_context Context, pi_context_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:1520
piextEnqueueCommandBuffer
pi_result piextEnqueueCommandBuffer(pi_ext_command_buffer CommandBuffer, pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to submit the command-buffer to queue for execution, returns an error if the command-buffer is no...
Definition: pi_cuda.cpp:1140
pi_buff_rect_region_struct
Definition: pi.h:1025
piProgramGetBuildInfo
pi_result piProgramGetBuildInfo(pi_program Program, pi_device Device, pi_program_build_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:304
pi2ur::piextMemGetNativeHandle
pi_result piextMemGetNativeHandle(pi_mem Mem, pi_native_handle *NativeHandle)
Gets the native handle of a PI mem object.
Definition: pi2ur.hpp:3042
pi_device_binary_struct
This struct is a record of the device binary information.
Definition: pi.h:959
piextEventCreateWithNativeHandle
pi_result piextEventCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, pi_event *Event)
Creates PI event object from a native handle.
Definition: pi_cuda.cpp:604
piextMemImportOpaqueFD
pi_result piextMemImportOpaqueFD(pi_context Context, pi_device Device, size_t Size, int FileDescriptor, pi_interop_mem_handle *RetHandle)
API to import external memory in the form of a file descriptor.
Definition: pi_cuda.cpp:453
pi_interop_mem_handle
pi_uint64 pi_interop_mem_handle
Definition: pi.h:1093
piextCommandBufferMemBufferCopyRect
pi_result piextCommandBufferMemBufferCopyRect(pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem, pi_buff_rect_offset SrcOrigin, pi_buff_rect_offset DstOrigin, pi_buff_rect_region Region, size_t SrcRowPitch, size_t SrcSlicePitch, size_t DstRowPitch, size_t DstSlicePitch, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer copy command to the command-buffer.
Definition: pi_cuda.cpp:1084
pi2ur::piPluginGetLastError
pi_result piPluginGetLastError(char **Message)
API to get Plugin specific warning and error messages.
Definition: pi2ur.hpp:977
pi2ur::piextMemCreateWithNativeHandle
pi_result piextMemCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, pi_mem *Mem)
Creates PI mem object from a native handle.
Definition: pi2ur.hpp:3087
pi2ur::piEnqueueEventsWait
pi_result piEnqueueEventsWait(pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3903
_pi_kernel_exec_info
_pi_kernel_exec_info
Definition: pi.h:1530
pi2ur::piDeviceRelease
pi_result piDeviceRelease(pi_device Device)
Definition: pi2ur.hpp:969
pi2ur::piextPluginGetOpaqueData
pi_result piextPluginGetOpaqueData(void *opaque_data_param, void **opaque_data_return)
API to get Plugin internal data, opaque to SYCL RT.
Definition: pi2ur.hpp:907
piextContextCreateWithNativeHandle
pi_result piextContextCreateWithNativeHandle(pi_native_handle NativeHandle, pi_uint32 NumDevices, const pi_device *Devices, bool OwnNativeHandle, pi_context *RetContext)
Creates PI context object from a native handle.
Definition: pi_cuda.cpp:138
pi2ur::piextMemImageAllocate
pi_result piextMemImageAllocate(pi_context Context, pi_device Device, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_image_mem_handle *RetMem)
API to allocate memory for bindless images.
Definition: pi2ur.hpp:4583
pi2ur::piEnqueueMemBufferCopyRect
pi_result piEnqueueMemBufferCopyRect(pi_queue Queue, pi_mem SrcMem, pi_mem DstMem, pi_buff_rect_offset SrcOrigin, pi_buff_rect_offset DstOrigin, pi_buff_rect_region Region, size_t SrcRowPitch, size_t SrcSlicePitch, size_t DstRowPitch, size_t DstSlicePitch, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3689
pi2ur::piProgramCompile
pi_result piProgramCompile(pi_program Program, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, pi_uint32 NumInputHeaders, const pi_program *InputHeaders, const char **HeaderIncludeNames, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData)
Definition: pi2ur.hpp:1996
piMemGetInfo
pi_result piMemGetInfo(pi_mem Mem, pi_mem_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:212
pi_mem_flags
pi_bitfield pi_mem_flags
Definition: pi.h:694
piextPlatformGetNativeHandle
pi_result piextPlatformGetNativeHandle(pi_platform Platform, pi_native_handle *NativeHandle)
Gets the native handle of a PI platform object.
Definition: pi_cuda.cpp:37
piQueueGetInfo
pi_result piQueueGetInfo(pi_queue Queue, pi_queue_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:167
pi2ur::piextMemMipmapGetLevel
pi_result piextMemMipmapGetLevel(pi_context Context, pi_device Device, pi_image_mem_handle MipMem, unsigned int Level, pi_image_mem_handle *RetMem)
API to retrieve individual image from mipmap.
Definition: pi2ur.hpp:4740
pi2ur::piextMemUnsampledImageCreate
pi_result piextMemUnsampledImageCreate(pi_context Context, pi_device Device, pi_image_mem_handle ImgMem, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_mem *RetMem, pi_image_handle *RetHandle)
API to create bindless image handles.
Definition: pi2ur.hpp:4606
pi2ur::piDeviceRetain
pi_result piDeviceRetain(pi_device Device)
Definition: pi2ur.hpp:961
pi2ur::piextBindlessImageSamplerCreate
pi_result piextBindlessImageSamplerCreate(pi_context Context, const pi_sampler_properties *SamplerProperties, float MinMipmapLevelClamp, float MaxMipmapLevelClamp, float MaxAnisotropy, pi_sampler *RetSampler)
API to create samplers for bindless images.
Definition: pi2ur.hpp:4662
pi_context_extended_deleter
void(* pi_context_extended_deleter)(void *user_data)
Definition: pi.h:1271
piextUSMEnqueueFill2D
pi_result piextUSMEnqueueFill2D(pi_queue Queue, void *Ptr, size_t Pitch, size_t PatternSize, const void *Pattern, size_t Width, size_t Height, pi_uint32 NumEventsWaitList, const pi_event *EventsWaitList, pi_event *Event)
USM 2D fill API.
Definition: pi_cuda.cpp:909
pi2ur::piKernelSetExecInfo
pi_result piKernelSetExecInfo(pi_kernel Kernel, pi_kernel_exec_info ParamName, size_t ParamValueSize, const void *ParamValue)
API to set attributes controlling kernel execution.
Definition: pi2ur.hpp:2249
pi2ur::piKernelGetInfo
pi_result piKernelGetInfo(pi_kernel Kernel, pi_kernel_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:2330
piextEventGetNativeHandle
pi_result piextEventGetNativeHandle(pi_event Event, pi_native_handle *NativeHandle)
Gets the native handle of a PI event object.
Definition: pi_cuda.cpp:598
piextCommandBufferNDRangeKernel
pi_result piextCommandBufferNDRangeKernel(pi_ext_command_buffer CommandBuffer, pi_kernel Kernel, pi_uint32 WorkDim, const size_t *GlobalWorkOffset, const size_t *GlobalWorkSize, const size_t *LocalWorkSize, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a kernel execution command to the command-buffer.
Definition: pi_cuda.cpp:1055
piextContextGetNativeHandle
pi_result piextContextGetNativeHandle(pi_context Context, pi_native_handle *NativeHandle)
Gets the native handle of a PI context object.
Definition: pi_cuda.cpp:133
piContextGetInfo
pi_result piContextGetInfo(pi_context Context, pi_context_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:119
defines.hpp
pi2ur::piextUSMFree
pi_result piextUSMFree(pi_context Context, void *Ptr)
Indicates that the allocated USM memory is no longer needed on the runtime side.
Definition: pi2ur.hpp:3196
piextMemSampledImageCreate
pi_result piextMemSampledImageCreate(pi_context Context, pi_device Device, pi_image_mem_handle ImgMem, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_sampler Sampler, pi_mem *RetMem, pi_image_handle *RetHandle)
API to create sampled bindless image handles.
Definition: pi_cuda.cpp:385
pi2ur::piextCommandBufferFinalize
pi_result piextCommandBufferFinalize(pi_ext_command_buffer CommandBuffer)
API to stop command-buffer recording such that no more commands can be appended, and makes the comman...
Definition: pi2ur.hpp:4319
pi2ur::piextUSMEnqueueMemcpy
pi_result piextUSMEnqueueMemcpy(pi_queue Queue, pi_bool Blocking, void *DstPtr, const void *SrcPtr, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
USM Memcpy API.
Definition: pi2ur.hpp:3748
pi2ur::piextDeviceSelectBinary
pi_result piextDeviceSelectBinary(pi_device Device, pi_device_binary *Binaries, pi_uint32 NumBinaries, pi_uint32 *SelectedBinaryInd)
Selects the most appropriate device binary based on runtime information and the IR characteristics.
Definition: pi2ur.hpp:1398
piPluginInit
pi_result piPluginInit(pi_plugin *PluginInit)
Definition: pi_cuda.cpp:1186
piEnqueueMemUnmap
pi_result piEnqueueMemUnmap(pi_queue Queue, pi_mem Mem, void *MappedPtr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent)
Definition: pi_cuda.cpp:750
pi2ur::piextCommandBufferCreate
pi_result piextCommandBufferCreate(pi_context Context, pi_device Device, const pi_ext_command_buffer_desc *Desc, pi_ext_command_buffer *RetCommandBuffer)
API to create a command-buffer.
Definition: pi2ur.hpp:4282
pi2ur::piQueueGetInfo
pi_result piQueueGetInfo(pi_queue Queue, pi_queue_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:1758
piEventGetInfo
pi_result piEventGetInfo(pi_event Event, pi_event_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:560
pi_ext_sync_point
pi_uint32 pi_ext_sync_point
Definition: pi.h:2260
pi2ur::piextQueueCreateWithNativeHandle
pi_result piextQueueCreateWithNativeHandle(pi_native_handle NativeHandle, int32_t NativeHandleDesc, pi_context Context, pi_device Device, bool OwnNativeHandle, pi_queue_properties *Properties, pi_queue *Queue)
Creates PI queue object from a native handle.
Definition: pi2ur.hpp:1671
piDeviceGetInfo
pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Returns requested info for provided native device Return PI_DEVICE_INFO_EXTENSION_DEVICELIB_ASSERT fo...
Definition: pi_cuda.cpp:73
pi2ur::piMemBufferCreate
pi_result piMemBufferCreate(pi_context Context, pi_mem_flags Flags, size_t Size, void *HostPtr, pi_mem *RetMem, const pi_mem_properties *properties)
Definition: pi2ur.hpp:2634
pi2ur::piextUSMRelease
pi_result piextUSMRelease(const void *HostPtr, pi_context Context)
Release host system memory from USM.
Definition: pi2ur.hpp:3405
piextUSMDeviceAlloc
pi_result piextUSMDeviceAlloc(void **ResultPtr, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates device memory.
Definition: pi_cuda.cpp:828
pi2ur::piextUSMEnqueuePrefetch
pi_result piextUSMEnqueuePrefetch(pi_queue Queue, const void *Ptr, size_t Size, pi_usm_migration_flags Flags, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Hint to migrate memory to the device.
Definition: pi2ur.hpp:3232
sycl::_V1::ext::oneapi::experimental::detail::Alignment
@ Alignment
Definition: property.hpp:193
piextUSMGetMemAllocInfo
pi_result piextUSMGetMemAllocInfo(pi_context Context, const void *Ptr, pi_mem_alloc_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
API to query information about USM allocated pointers Valid Queries: PI_MEM_ALLOC_TYPE returns host/d...
Definition: pi_cuda.cpp:945
piextDeviceGetNativeHandle
pi_result piextDeviceGetNativeHandle(pi_device Device, pi_native_handle *NativeHandle)
Gets the native handle of a PI device object.
Definition: pi_cuda.cpp:95
pi2ur::piSamplerRetain
pi_result piSamplerRetain(pi_sampler Sampler)
Definition: pi2ur.hpp:4253
piextQueueCreate
pi_result piextQueueCreate(pi_context Context, pi_device Device, pi_queue_properties *Properties, pi_queue *Queue)
Definition: pi_cuda.cpp:162
piGetDeviceAndHostTimer
pi_result piGetDeviceAndHostTimer(pi_device Device, uint64_t *DeviceTime, uint64_t *HostTime)
Queries device for it's global timestamp in nanoseconds, and updates HostTime with the value of the h...
Definition: pi_cuda.cpp:1158
pi_uint64
uint64_t pi_uint64
Definition: pi.h:195
pi2ur::piextUSMDeviceAlloc
pi_result piextUSMDeviceAlloc(void **ResultPtr, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates device memory.
Definition: pi2ur.hpp:3108
pi2ur::piextCommandBufferRetain
pi_result piextCommandBufferRetain(pi_ext_command_buffer CommandBuffer)
API to increment the reference count of the command-buffer.
Definition: pi2ur.hpp:4299
piEventGetProfilingInfo
pi_result piEventGetProfilingInfo(pi_event Event, pi_profiling_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:567
_pi_event_info
_pi_event_info
Definition: pi.h:514
piextCommandBufferMemBufferCopy
pi_result piextCommandBufferMemBufferCopy(pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem, size_t SrcOffset, size_t DstOffset, size_t Size, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer copy command to the command-buffer.
Definition: pi_cuda.cpp:1074
_PI_CUDA_PLUGIN_VERSION_STRING
#define _PI_CUDA_PLUGIN_VERSION_STRING
Definition: pi_cuda.hpp:25
piContextCreate
pi_result piContextCreate(const pi_context_properties *Properties, pi_uint32 NumDevices, const pi_device *Devices, void(*PFnNotify)(const char *ErrInfo, const void *PrivateInfo, size_t CB, void *UserData), void *UserData, pi_context *RetContext)
Definition: pi_cuda.cpp:109
_pi_sampler_info
_pi_sampler_info
Definition: pi.h:630
_pi_device_binary_property_struct
Definition: pi.h:855
pi_mem_properties
pi_bitfield pi_mem_properties
Definition: pi.h:710
_pi_program
Definition: pi_cuda.hpp:68
pi2ur::piEnqueueMemBufferWrite
pi_result piEnqueueMemBufferWrite(pi_queue Queue, pi_mem Buffer, pi_bool BlockingWrite, size_t Offset, size_t Size, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3802
pi2ur::piextMemImageGetInfo
pi_result piextMemImageGetInfo(pi_image_mem_handle MemHandle, pi_image_info ParamName, void *ParamValue, size_t *ParamValueSizeRet)
API to query an image memory handle for specific properties.
Definition: pi2ur.hpp:4903
pi_cuda.hpp
_pi_sampler
Definition: pi_cuda.hpp:76
pi2ur::piextDestroyExternalSemaphore
pi_result piextDestroyExternalSemaphore(pi_context Context, pi_device Device, pi_interop_semaphore_handle SemHandle)
API to destroy the external semaphore handle.
Definition: pi2ur.hpp:5022
pi2ur::piProgramGetInfo
pi_result piProgramGetInfo(pi_program Program, pi_program_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:1906
piQueueFlush
pi_result piQueueFlush(pi_queue Queue)
Definition: pi_cuda.cpp:183
piEnqueueMemBufferMap
pi_result piEnqueueMemBufferMap(pi_queue Queue, pi_mem Mem, pi_bool BlockingMap, pi_map_flags MapFlags, size_t Offset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent, void **RetMap)
Definition: pi_cuda.cpp:739
piextDeviceCreateWithNativeHandle
pi_result piextDeviceCreateWithNativeHandle(pi_native_handle NativeHandle, pi_platform Platform, pi_device *Device)
Creates PI device object from a native handle.
Definition: pi_cuda.cpp:101
piQueueFinish
pi_result piQueueFinish(pi_queue Queue)
Definition: pi_cuda.cpp:181
pi2ur::piextQueueGetNativeHandle
pi_result piextQueueGetNativeHandle(pi_queue Queue, pi_native_handle *NativeHandle, int32_t *NativeHandleDesc)
Gets the native handle of a PI queue object.
Definition: pi2ur.hpp:1717
pi2ur::piextKernelSetArgPointer
pi_result piextKernelSetArgPointer(pi_kernel Kernel, pi_uint32 ArgIndex, size_t, const void *ArgValue)
Sets up pointer arguments for CL kernels.
Definition: pi2ur.hpp:2462
piDeviceRelease
pi_result piDeviceRelease(pi_device Device)
Definition: pi_cuda.cpp:69
piPlatformGetInfo
pi_result piPlatformGetInfo(pi_platform Platform, pi_platform_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:30
piEventCreate
pi_result piEventCreate(pi_context Context, pi_event *RetEvent)
Create PI event object in a signalled/completed state.
Definition: pi_cuda.cpp:556
pi2ur::piextContextGetNativeHandle
pi_result piextContextGetNativeHandle(pi_context Context, pi_native_handle *NativeHandle)
Gets the native handle of a PI context object.
Definition: pi2ur.hpp:1486
piQueueRelease
pi_result piQueueRelease(pi_queue Queue)
Definition: pi_cuda.cpp:177
pi_native_handle
uintptr_t pi_native_handle
Definition: pi.h:198
piextPluginGetOpaqueData
pi_result piextPluginGetOpaqueData(void *opaque_data_param, void **opaque_data_return)
API to get Plugin internal data, opaque to SYCL RT.
Definition: pi_cuda.cpp:1149
pi2ur::piProgramGetBuildInfo
pi_result piProgramGetBuildInfo(pi_program Program, pi_device Device, pi_program_build_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:2508
piextDeviceSelectBinary
pi_result piextDeviceSelectBinary(pi_device Device, pi_device_binary *Binaries, pi_uint32 NumBinaries, pi_uint32 *SelectedBinaryInd)
Selects the most appropriate device binary based on runtime information and the IR characteristics.
Definition: pi_cuda.cpp:88
pi2ur::piQueueRelease
pi_result piQueueRelease(pi_queue Queue)
Definition: pi2ur.hpp:1737
pi_sampler_properties
pi_bitfield pi_sampler_properties
Definition: pi.h:662
piTearDown
pi_result piTearDown(void *PluginParameter)
API to notify that the plugin should clean up its resources.
Definition: pi_cuda.cpp:1154
piEnqueueMemImageWrite
pi_result piEnqueueMemImageWrite(pi_queue Queue, pi_mem Image, pi_bool BlockingWrite, pi_image_offset Origin, pi_image_region Region, size_t InputRowPitch, size_t InputSlicePitch, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:778
pi2ur::piEnqueueMemBufferReadRect
pi_result piEnqueueMemBufferReadRect(pi_queue Queue, pi_mem Buffer, pi_bool BlockingRead, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3826
pi2ur::piMemImageCreate
pi_result piMemImageCreate(pi_context Context, pi_mem_flags Flags, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, void *HostPtr, pi_mem *RetImage)
Definition: pi2ur.hpp:2924
piProgramGetInfo
pi_result piProgramGetInfo(pi_program Program, pi_program_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:266
_pi_image_format
Definition: pi.h:1096
piProgramCreate
pi_result piProgramCreate(pi_context Context, const void *ILBytes, size_t Length, pi_program *Program)
Definition: pi_cuda.cpp:242
_pi_kernel_info
_pi_kernel_info
Definition: pi.h:477
piKernelGetSubGroupInfo
pi_result piKernelGetSubGroupInfo(pi_kernel Kernel, pi_device Device, pi_kernel_sub_group_info ParamName, size_t InputValueSize, const void *InputValue, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
API to query information from the sub-group from a kernel.
Definition: pi_cuda.cpp:510
pi2ur::piextUSMEnqueueFill2D
pi_result piextUSMEnqueueFill2D(pi_queue Queue, void *Ptr, size_t Pitch, size_t PatternSize, const void *Pattern, size_t Width, size_t Height, pi_uint32 NumEventsWaitList, const pi_event *EventsWaitList, pi_event *Event)
USM 2D Fill API.
Definition: pi2ur.hpp:3313
pi2ur::piEventRelease
pi_result piEventRelease(pi_event Event)
Definition: pi2ur.hpp:4129
pi2ur::piextMemSampledImageHandleDestroy
pi_result piextMemSampledImageHandleDestroy(pi_context Context, pi_device Device, pi_image_handle Handle)
API to destroy bindless sampled image handles.
Definition: pi2ur.hpp:4866
piextMemUnsampledImageHandleDestroy
pi_result piextMemUnsampledImageHandleDestroy(pi_context Context, pi_device Device, pi_image_handle Handle)
API to destroy bindless unsampled image handles.
Definition: pi_cuda.cpp:434
piextCommandBufferCreate
pi_result piextCommandBufferCreate(pi_context Context, pi_device Device, const pi_ext_command_buffer_desc *Desc, pi_ext_command_buffer *RetCommandBuffer)
API to create a command-buffer.
Definition: pi_cuda.cpp:1036
piextWaitExternalSemaphore
pi_result piextWaitExternalSemaphore(pi_queue Queue, pi_interop_semaphore_handle SemHandle, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to instruct the queue with a non-blocking wait on an external semaphore.
Definition: pi_cuda.cpp:486
pi2ur::piextEnqueueCommandBuffer
pi_result piextEnqueueCommandBuffer(pi_ext_command_buffer CommandBuffer, pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to submit the command-buffer to queue for execution, returns an error if the command-buffer is no...
Definition: pi2ur.hpp:4502
piextCommandBufferMemBufferRead
pi_result piextCommandBufferMemBufferRead(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, size_t Offset, size_t Size, void *Dst, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer read command to the command-buffer.
Definition: pi_cuda.cpp:1096
piMemBufferPartition
pi_result piMemBufferPartition(pi_mem Buffer, pi_mem_flags Flags, pi_buffer_create_type BufferCreateType, void *BufferCreateInfo, pi_mem *RetMem)
Definition: pi_cuda.cpp:813
piextMemImageAllocate
pi_result piextMemImageAllocate(pi_context Context, pi_device Device, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_image_mem_handle *RetMem)
API to allocate memory for bindless images.
Definition: pi_cuda.cpp:368
pi2ur::piextMemReleaseInterop
pi_result piextMemReleaseInterop(pi_context Context, pi_device Device, pi_interop_mem_handle ExtMem)
API to destroy interop memory.
Definition: pi2ur.hpp:4980
pi_image_mem_handle
void * pi_image_mem_handle
Definition: pi.h:1092
piextContextSetExtendedDeleter
pi_result piextContextSetExtendedDeleter(pi_context Context, pi_context_extended_deleter Function, void *UserData)
Definition: pi_cuda.cpp:127
pi_image_handle
pi_uint64 pi_image_handle
Definition: pi.h:1091
piSamplerCreate
pi_result piSamplerCreate(pi_context Context, const pi_sampler_properties *SamplerProperties, pi_sampler *RetSampler)
Definition: pi_cuda.cpp:612
piEnqueueMemBufferWriteRect
pi_result piEnqueueMemBufferWriteRect(pi_queue Queue, pi_mem Buffer, pi_bool BlockingWrite, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, const void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:689
pi2ur::piextCommandBufferMemBufferReadRect
pi_result piextCommandBufferMemBufferReadRect(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer read command to the command-buffer.
Definition: pi2ur.hpp:4406
_PI_PLUGIN_VERSION_CHECK
#define _PI_PLUGIN_VERSION_CHECK(PI_API_VERSION, PI_PLUGIN_VERSION)
Definition: pi.h:171
pi2ur::piextCommandBufferNDRangeKernel
pi_result piextCommandBufferNDRangeKernel(pi_ext_command_buffer CommandBuffer, pi_kernel Kernel, pi_uint32 WorkDim, const size_t *GlobalWorkOffset, const size_t *GlobalWorkSize, const size_t *LocalWorkSize, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a kernel execution command to the command-buffer.
Definition: pi2ur.hpp:4328
piextCommandBufferMemBufferReadRect
pi_result piextCommandBufferMemBufferReadRect(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, pi_buff_rect_offset BufferOffset, pi_buff_rect_offset HostOffset, pi_buff_rect_region Region, size_t BufferRowPitch, size_t BufferSlicePitch, size_t HostRowPitch, size_t HostSlicePitch, void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a rectangular mem buffer read command to the command-buffer.
Definition: pi_cuda.cpp:1105
pi2ur::piMemBufferPartition
pi_result piMemBufferPartition(pi_mem Buffer, pi_mem_flags Flags, pi_buffer_create_type BufferCreateType, void *BufferCreateInfo, pi_mem *RetMem)
Definition: pi2ur.hpp:2995
piextUSMSharedAlloc
pi_result piextUSMSharedAlloc(void **ResultPtr, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates memory accessible on both host and device.
Definition: pi_cuda.cpp:837
piextMemMipmapGetLevel
pi_result piextMemMipmapGetLevel(pi_context Context, pi_device Device, pi_image_mem_handle MipMem, unsigned int Level, pi_image_mem_handle *RetMem)
API to retrieve individual image from mipmap.
Definition: pi_cuda.cpp:403
piextUSMHostAlloc
pi_result piextUSMHostAlloc(void **ResultPtr, pi_context Context, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates host memory accessible by the device.
Definition: pi_cuda.cpp:856
pi2ur::piMemGetInfo
pi_result piMemGetInfo(pi_mem Mem, pi_mem_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:2689
piextMemUnsampledImageCreate
pi_result piextMemUnsampledImageCreate(pi_context Context, pi_device Device, pi_image_mem_handle ImgMem, pi_image_format *ImageFormat, pi_image_desc *ImageDesc, pi_mem *RetMem, pi_image_handle *RetHandle)
API to create bindless image handles.
Definition: pi_cuda.cpp:377
pi2ur::piMemRetain
pi_result piMemRetain(pi_mem Mem)
Definition: pi2ur.hpp:3203
pi2ur::piextQueueCreate
pi_result piextQueueCreate(pi_context Context, pi_device Device, pi_queue_properties *Properties, pi_queue *Queue)
Definition: pi2ur.hpp:1594
pi2ur::piEnqueueMemImageRead
pi_result piEnqueueMemImageRead(pi_queue Queue, pi_mem Image, pi_bool BlockingRead, pi_image_offset Origin, pi_image_region Region, size_t RowPitch, size_t SlicePitch, void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3562
piextCommandBufferMemBufferWrite
pi_result piextCommandBufferMemBufferWrite(pi_ext_command_buffer CommandBuffer, pi_mem Buffer, size_t Offset, size_t Size, const void *Ptr, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer write command to the command-buffer.
Definition: pi_cuda.cpp:1118
pi_queue_properties
pi_bitfield pi_queue_properties
Definition: pi.h:729
_pi_platform_info
_pi_platform_info
Definition: pi.h:220
pi2ur::piextGetDeviceFunctionPointer
pi_result piextGetDeviceFunctionPointer(pi_device Device, pi_program Program, const char *FunctionName, pi_uint64 *FunctionPointerRet)
Retrieves a device function pointer to a user-defined function.
Definition: pi2ur.hpp:2113
piProgramCreateWithBinary
pi_result piProgramCreateWithBinary(pi_context Context, pi_uint32 NumDevices, const pi_device *DeviceList, const size_t *Lengths, const unsigned char **Binaries, size_t NumMetadataEntries, const pi_device_binary_property *Metadata, pi_int32 *BinaryStatus, pi_program *Program)
Creates a PI program for a context and loads the given binary into it.
Definition: pi_cuda.cpp:247
pi2ur::piextKernelSetArgMemObj
pi_result piextKernelSetArgMemObj(pi_kernel Kernel, pi_uint32 ArgIndex, const pi_mem_obj_property *ArgProperties, const pi_mem *ArgValue)
Definition: pi2ur.hpp:2134
_pi_image_desc
Definition: pi.h:1101
pi2ur::piextDeviceCreateWithNativeHandle
pi_result piextDeviceCreateWithNativeHandle(pi_native_handle NativeHandle, pi_platform Platform, pi_device *Device)
Creates PI device object from a native handle.
Definition: pi2ur.hpp:1296
piQueueRetain
pi_result piQueueRetain(pi_queue Queue)
Definition: pi_cuda.cpp:175
_pi_event
Definition: pi_cuda.hpp:64
pi2ur::piContextRelease
pi_result piContextRelease(pi_context Context)
Definition: pi2ur.hpp:1583
piQueueCreate
pi_result piQueueCreate(pi_context Context, pi_device Device, pi_queue_properties Flags, pi_queue *Queue)
Definition: pi_cuda.cpp:156
piextDestroyExternalSemaphore
pi_result piextDestroyExternalSemaphore(pi_context Context, pi_device Device, pi_interop_semaphore_handle SemHandle)
API to destroy the external semaphore handle.
Definition: pi_cuda.cpp:481
piextCommandBufferMemcpyUSM
pi_result piextCommandBufferMemcpyUSM(pi_ext_command_buffer CommandBuffer, void *DstPtr, const void *SrcPtr, size_t Size, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a USM memcpy command to the command-buffer.
Definition: pi_cuda.cpp:1065
pi2ur::piextMemImageCopy
pi_result piextMemImageCopy(pi_queue Queue, void *DstPtr, void *SrcPtr, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, const pi_image_copy_flags Flags, pi_image_offset SrcOffset, pi_image_offset DstOffset, pi_image_region CopyExtent, pi_image_region HostExtent, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to copy image data Host to Device or Device to Host.
Definition: pi2ur.hpp:4809
pi2ur::piextMemUnsampledImageHandleDestroy
pi_result piextMemUnsampledImageHandleDestroy(pi_context Context, pi_device Device, pi_image_handle Handle)
API to destroy bindless unsampled image handles.
Definition: pi2ur.hpp:4850
piKernelGetInfo
pi_result piKernelGetInfo(pi_kernel Kernel, pi_kernel_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:360
pi2ur::piSamplerRelease
pi_result piSamplerRelease(pi_sampler Sampler)
Definition: pi2ur.hpp:4264
pi2ur::piQueueFlush
pi_result piQueueFlush(pi_queue Queue)
Definition: pi2ur.hpp:1819
pi2ur::piextImportExternalSemaphoreOpaqueFD
pi_result piextImportExternalSemaphoreOpaqueFD(pi_context Context, pi_device Device, int FileDescriptor, pi_interop_semaphore_handle *RetHandle)
API to import an external semaphore in the form of a file descriptor.
Definition: pi2ur.hpp:4996
pi2ur::piDeviceGetInfo
pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Returns requested info for provided native device Return PI_DEVICE_INFO_EXTENSION_DEVICELIB_ASSERT fo...
Definition: pi2ur.hpp:994
piMemRetain
pi_result piMemRetain(pi_mem Mem)
Definition: pi_cuda.cpp:218
_pi_mem_info
_pi_mem_info
Definition: pi.h:1117
pi_image_offset_struct
Definition: pi.h:1034
pi2ur::piContextRetain
pi_result piContextRetain(pi_context Context)
Definition: pi2ur.hpp:1575
pi2ur::piProgramBuild
pi_result piProgramBuild(pi_program Program, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData)
Definition: pi2ur.hpp:2028
pi2ur::piextCommandBufferMemBufferCopy
pi_result piextCommandBufferMemBufferCopy(pi_ext_command_buffer CommandBuffer, pi_mem SrcMem, pi_mem DstMem, size_t SrcOffset, size_t DstOffset, size_t Size, pi_uint32 NumSyncPointsInWaitList, const pi_ext_sync_point *SyncPointWaitList, pi_ext_sync_point *SyncPoint)
API to append a mem buffer copy command to the command-buffer.
Definition: pi2ur.hpp:4359
piextEnablePeerAccess
pi_result piextEnablePeerAccess(pi_device command_device, pi_device peer_device)
Definition: pi_cuda.cpp:1163
pi2ur::piextUSMEnqueueMemAdvise
pi_result piextUSMEnqueueMemAdvise(pi_queue Queue, const void *Ptr, size_t Length, pi_mem_advice Advice, pi_event *OutEvent)
USM memadvise API to govern behavior of automatic migration mechanisms.
Definition: pi2ur.hpp:3269
piProgramBuild
pi_result piProgramBuild(pi_program Program, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData)
Definition: pi_cuda.cpp:296
pi_image_region_struct
Definition: pi.h:1043
pi2ur::piEnqueueMemBufferRead
pi_result piEnqueueMemBufferRead(pi_queue Queue, pi_mem Src, pi_bool BlockingRead, size_t Offset, size_t Size, void *Dst, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3861
pi2ur::piextProgramCreateWithNativeHandle
pi_result piextProgramCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, pi_program *Program)
Creates PI program object from a native handle.
Definition: pi2ur.hpp:2310
piextMemImageFree
pi_result piextMemImageFree(pi_context Context, pi_device Device, pi_image_mem_handle MemoryHandle)
API to free memory for bindless images.
Definition: pi_cuda.cpp:411
piEnqueueMemImageRead
pi_result piEnqueueMemImageRead(pi_queue Queue, pi_mem Image, pi_bool BlockingRead, pi_image_offset Origin, pi_image_region Region, size_t RowPitch, size_t SlicePitch, void *Ptr, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:766
piEnqueueMemBufferFill
pi_result piEnqueueMemBufferFill(pi_queue Queue, pi_mem Buffer, const void *Pattern, size_t PatternSize, size_t Offset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:727
piextMemMipmapFree
pi_result piextMemMipmapFree(pi_context Context, pi_device Device, pi_image_mem_handle MemoryHandle)
API to free mipmap memory for bindless images.
Definition: pi_cuda.cpp:416
_pi_mem_obj_property
Definition: pi.h:1828
_pi_usm_migration_flags
_pi_usm_migration_flags
Definition: pi.h:1886
piKernelSetExecInfo
pi_result piKernelSetExecInfo(pi_kernel Kernel, pi_kernel_exec_info ParamName, size_t ParamValueSize, const void *ParamValue)
API to set attributes controlling kernel execution.
Definition: pi_cuda.cpp:1021
pi2ur::piEnqueueKernelLaunch
pi_result piEnqueueKernelLaunch(pi_queue Queue, pi_kernel Kernel, pi_uint32 WorkDim, const size_t *GlobalWorkOffset, const size_t *GlobalWorkSize, const size_t *LocalWorkSize, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3508
pi2ur::piEventGetInfo
pi_result piEventGetInfo(pi_event Event, pi_event_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi2ur.hpp:3979
piextUSMEnqueueMemcpy2D
pi_result piextUSMEnqueueMemcpy2D(pi_queue Queue, pi_bool Blocking, void *DstPtr, size_t DstPitch, const void *SrcPtr, size_t SrcPitch, size_t Width, size_t Height, pi_uint32 NumEventsInWaitlist, const pi_event *EventWaitlist, pi_event *Event)
USM 2D Memcpy API.
Definition: pi_cuda.cpp:934
die
void die(const char *Message)
Definition: ur.hpp:52
_pi_program_info
_pi_program_info
Definition: pi.h:436
pi2ur::piKernelRetain
pi_result piKernelRetain(pi_kernel Kernel)
Definition: pi2ur.hpp:2428
_pi_profiling_info
_pi_profiling_info
Definition: pi.h:683
_pi_plugin::PiFunctionTable
struct _pi_plugin::FunctionPointers PiFunctionTable
pi2ur::piextMemMipmapFree
pi_result piextMemMipmapFree(pi_context Context, pi_device Device, pi_image_mem_handle MemoryHandle)
API to free mipmap memory for bindless images.
Definition: pi2ur.hpp:4775
pi_interop_semaphore_handle
pi_uint64 pi_interop_semaphore_handle
Definition: pi.h:1094
piextKernelSetArgMemObj
pi_result piextKernelSetArgMemObj(pi_kernel Kernel, pi_uint32 ArgIndex, const pi_mem_obj_property *ArgProperties, const pi_mem *ArgValue)
Definition: pi_cuda.cpp:347
piKernelGetGroupInfo
pi_result piKernelGetGroupInfo(pi_kernel Kernel, pi_device Device, pi_kernel_group_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:502
pi2ur::piextPeerAccessGetInfo
pi_result piextPeerAccessGetInfo(pi_device command_device, pi_device peer_device, pi_peer_attr attr, size_t param_value_size, void *param_value, size_t *param_value_size_ret)
Definition: pi2ur.hpp:4549
pi2ur::piextPlatformGetNativeHandle
pi_result piextPlatformGetNativeHandle(pi_platform Platform, pi_native_handle *NativeHandle)
Gets the native handle of a PI platform object.
Definition: pi2ur.hpp:820
piextQueueGetNativeHandle
pi_result piextQueueGetNativeHandle(pi_queue Queue, pi_native_handle *NativeHandle, int32_t *NativeHandleDesc)
Gets the native handle of a PI queue object.
Definition: pi_cuda.cpp:185
pi2ur::piextContextSetExtendedDeleter
pi_result piextContextSetExtendedDeleter(pi_context Context, pi_context_extended_deleter Function, void *UserData)
Definition: pi2ur.hpp:1477
piProgramCompile
pi_result piProgramCompile(pi_program Program, pi_uint32 NumDevices, const pi_device *DeviceList, const char *Options, pi_uint32 NumInputHeaders, const pi_program *InputHeaders, const char **HeaderIncludeNames, void(*PFnNotify)(pi_program Program, void *UserData), void *UserData)
Definition: pi_cuda.cpp:285
piDevicesGet
pi_result piDevicesGet(pi_platform Platform, pi_device_type DeviceType, pi_uint32 NumEntries, pi_device *Devices, pi_uint32 *NumDevices)
Definition: pi_cuda.cpp:58
pi2ur::piProgramCreateWithBinary
pi_result piProgramCreateWithBinary(pi_context Context, pi_uint32 NumDevices, const pi_device *DeviceList, const size_t *Lengths, const unsigned char **Binaries, size_t NumMetadataEntries, const pi_device_binary_property *Metadata, pi_int32 *BinaryStatus, pi_program *Program)
Creates a PI program for a context and loads the given binary into it.
Definition: pi2ur.hpp:1855
piEventSetStatus
pi_result piEventSetStatus(pi_event Event, pi_int32 ExecutionStatus)
Definition: pi_cuda.cpp:588
piextProgramCreateWithNativeHandle
pi_result piextProgramCreateWithNativeHandle(pi_native_handle NativeHandle, pi_context Context, bool OwnNativeHandle, pi_program *Program)
Creates PI program object from a native handle.
Definition: pi_cuda.cpp:327
_pi_kernel_group_info
_pi_kernel_group_info
Definition: pi.h:486
piKernelSetArg
pi_result piKernelSetArg(pi_kernel Kernel, pi_uint32 ArgIndex, size_t ArgSize, const void *ArgValue)
Definition: pi_cuda.cpp:341
pi2ur::piPluginGetBackendOption
pi_result piPluginGetBackendOption(pi_platform Platform, const char *FrontendOption, const char **PlatformOption)
API to get backend specific option.
Definition: pi2ur.hpp:914
pi2ur::piextContextCreateWithNativeHandle
pi_result piextContextCreateWithNativeHandle(pi_native_handle NativeHandle, pi_uint32 NumDevices, const pi_device *Devices, bool OwnNativeHandle, pi_context *RetContext)
Creates PI context object from a native handle.
Definition: pi2ur.hpp:1497
_pi_peer_attr
_pi_peer_attr
Definition: pi.h:1119
piextMemImageCopy
pi_result piextMemImageCopy(pi_queue Queue, void *DstPtr, void *SrcPtr, const pi_image_format *ImageFormat, const pi_image_desc *ImageDesc, const pi_image_copy_flags Flags, pi_image_offset SrcOffset, pi_image_offset DstOffset, pi_image_region CopyExtent, pi_image_region HostExtent, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
API to copy image data Host to Device or Device to Host.
Definition: pi_cuda.cpp:421
piKernelRelease
pi_result piKernelRelease(pi_kernel Kernel)
Definition: pi_cuda.cpp:525
pi2ur::piEnqueueMemBufferFill
pi_result piEnqueueMemBufferFill(pi_queue Queue, pi_mem Buffer, const void *Pattern, size_t PatternSize, size_t Offset, size_t Size, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3643
piEventSetCallback
pi_result piEventSetCallback(pi_event Event, pi_int32 CommandExecCallbackType, void(*PFnNotify)(pi_event Event, pi_int32 EventCommandStatus, void *UserData), void *UserData)
Definition: pi_cuda.cpp:579
pi2ur::piextUSMSharedAlloc
pi_result piextUSMSharedAlloc(void **ResultPtr, pi_context Context, pi_device Device, pi_usm_mem_properties *Properties, size_t Size, pi_uint32 Alignment)
Allocates memory accessible on both host and device.
Definition: pi2ur.hpp:3148
piextEnqueueDeviceGlobalVariableWrite
pi_result piextEnqueueDeviceGlobalVariableWrite(pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingWrite, size_t Count, size_t Offset, const void *Src, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *Event)
Device global variable.
Definition: pi_cuda.cpp:961
piMemBufferCreate
pi_result piMemBufferCreate(pi_context Context, pi_mem_flags Flags, size_t Size, void *HostPtr, pi_mem *RetMem, const pi_mem_properties *properties)
Definition: pi_cuda.cpp:205
piextUSMEnqueuePrefetch
pi_result piextUSMEnqueuePrefetch(pi_queue Queue, const void *Ptr, size_t Size, pi_usm_migration_flags Flags, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *OutEvent)
Hint to migrate memory to the device.
Definition: pi_cuda.cpp:892
piEventsWait
pi_result piEventsWait(pi_uint32 NumEvents, const pi_event *EventList)
Definition: pi_cuda.cpp:575
_pi_mem_alloc_info
_pi_mem_alloc_info
Definition: pi.h:1869
pi2ur::piextUSMImport
pi_result piextUSMImport(const void *HostPtr, size_t Size, pi_context Context)
Import host system memory into USM.
Definition: pi2ur.hpp:3393
pi2ur::piextUSMEnqueueMemset
pi_result piextUSMEnqueueMemset(pi_queue Queue, void *Ptr, pi_int32 Value, size_t Count, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
USM Memset API.
Definition: pi2ur.hpp:3665
pi_usm_mem_properties
pi_bitfield pi_usm_mem_properties
Definition: pi.h:716
pi_map_flags
pi_bitfield pi_map_flags
Definition: pi.h:704
piextCommandBufferRelease
pi_result piextCommandBufferRelease(pi_ext_command_buffer CommandBuffer)
API to decrement the reference count of the command-buffer.
Definition: pi_cuda.cpp:1047
piextBindlessImageSamplerCreate
pi_result piextBindlessImageSamplerCreate(pi_context Context, const pi_sampler_properties *SamplerProperties, float MinMipmapLevelClamp, float MaxMipmapLevelClamp, float MaxAnisotropy, pi_sampler *RetSampler)
API to create samplers for bindless images.
Definition: pi_cuda.cpp:394
_pi_program_build_info
_pi_program_build_info
Definition: pi.h:229
piextQueueCreateWithNativeHandle
pi_result piextQueueCreateWithNativeHandle(pi_native_handle NativeHandle, int32_t NativeHandleDesc, pi_context Context, pi_device Device, bool OwnNativeHandle, pi_queue_properties *Properties, pi_queue *Queue)
Creates PI queue object from a native handle.
Definition: pi_cuda.cpp:193
pi2ur::piEnqueueEventsWaitWithBarrier
pi_result piEnqueueEventsWaitWithBarrier(pi_queue Queue, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3884
piPlatformsGet
pi_result piPlatformsGet(pi_uint32 NumEntries, pi_platform *Platforms, pi_uint32 *NumPlatforms)
Definition: pi_cuda.cpp:25
pi2ur::piextEnablePeerAccess
pi_result piextEnablePeerAccess(pi_device command_device, pi_device peer_device)
Definition: pi2ur.hpp:4528
piContextRetain
pi_result piContextRetain(pi_context Context)
Definition: pi_cuda.cpp:147
pi_device_partition_property
intptr_t pi_device_partition_property
Definition: pi.h:788
piextUSMFree
pi_result piextUSMFree(pi_context Context, void *Ptr)
Indicates that the allocated USM memory is no longer needed on the runtime side.
Definition: pi_cuda.cpp:863
pi2ur::piKernelGetSubGroupInfo
pi_result piKernelGetSubGroupInfo(pi_kernel Kernel, pi_device Device, pi_kernel_sub_group_info ParamName, size_t InputValueSize, const void *InputValue, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
API to query information from the sub-group from a kernel.
Definition: pi2ur.hpp:2471
piEventRetain
pi_result piEventRetain(pi_event Event)
Definition: pi_cuda.cpp:592
piEnqueueMemBufferRead
pi_result piEnqueueMemBufferRead(pi_queue Queue, pi_mem Src, pi_bool BlockingRead, size_t Offset, size_t Size, void *Dst, pi_uint32 NumEventsInWaitList, const pi_event *EventWaitList, pi_event *Event)
Definition: pi_cuda.cpp:651
pi2ur::piMemRelease
pi_result piMemRelease(pi_mem Mem)
Definition: pi2ur.hpp:3213
pi2ur::piEnqueueMemUnmap
pi_result piEnqueueMemUnmap(pi_queue Queue, pi_mem Mem, void *MappedPtr, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
Definition: pi2ur.hpp:3621
pi_int32
int32_t pi_int32
Definition: pi.h:193
_pi_context
Definition: pi_cuda.hpp:52
pi2ur::piEventSetCallback
pi_result piEventSetCallback(pi_event Event, pi_int32 CommandExecCallbackType, void(*PFnNotify)(pi_event Event, pi_int32 EventCommandStatus, void *UserData), void *UserData)
Definition: pi2ur.hpp:4100
PI_QUEUE_FLAGS
constexpr pi_queue_properties PI_QUEUE_FLAGS
Definition: pi.h:730
_pi_device
Definition: pi_cuda.hpp:48
_pi_kernel_sub_group_info
_pi_kernel_sub_group_info
Definition: pi.h:507
PI_ASSERT
#define PI_ASSERT(condition, error)
Definition: pi2ur.hpp:150
piextKernelGetNativeHandle
pi_result piextKernelGetNativeHandle(pi_kernel Kernel, pi_native_handle *NativeHandle)
Gets the native handle of a PI kernel object.
Definition: pi_cuda.cpp:551
piKernelRetain
pi_result piKernelRetain(pi_kernel Kernel)
Definition: pi_cuda.cpp:520
pi2ur::piContextCreate
pi_result piContextCreate(const pi_context_properties *Properties, pi_uint32 NumDevices, const pi_device *Devices, void(*PFnNotify)(const char *ErrInfo, const void *PrivateInfo, size_t CB, void *UserData), void *UserData, pi_context *RetContext)
Definition: pi2ur.hpp:1457
piSamplerGetInfo
pi_result piSamplerGetInfo(pi_sampler Sampler, pi_sampler_info ParamName, size_t ParamValueSize, void *ParamValue, size_t *ParamValueSizeRet)
Definition: pi_cuda.cpp:618
pi2ur::piextEnqueueDeviceGlobalVariableWrite
pi_result piextEnqueueDeviceGlobalVariableWrite(pi_queue Queue, pi_program Program, const char *Name, pi_bool BlockingWrite, size_t Count, size_t Offset, const void *Src, pi_uint32 NumEventsInWaitList, const pi_event *EventsWaitList, pi_event *OutEvent)
API for writing data from host to a device global variable.
Definition: pi2ur.hpp:2575
pi2ur::piextKernelSetArgSampler
pi_result piextKernelSetArgSampler(pi_kernel Kernel, pi_uint32 ArgIndex, const pi_sampler *ArgValue)
Definition: pi2ur.hpp:4242