Harmony18090's picture
Add source batch 2/11
76f9669 verified
raw
history blame
104 kB
# SPDX-FileCopyrightText: Copyright (c) 2021-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: LicenseRef-NVIDIA-SOFTWARE-LICENSE
# This code was automatically generated with version 12.9.0. Do not modify it directly.
include "../cyruntime_functions.pxi"
import os
cimport cuda.bindings._bindings.cyruntime_ptds as ptds
cimport cython
# Set to True by _cudaPythonInit() once the PTDS setting has been read.
cdef bint __cudaPythonInit = False
# Cached PTDS switch derived from CUDA_PYTHON_CUDA_PER_THREAD_DEFAULT_STREAM;
# when true, the wrappers below dispatch to the `ptds` module.
cdef bint __usePTDS = False
cdef int _cudaPythonInit() except -1 nogil:
    # One-time setup: read CUDA_PYTHON_CUDA_PER_THREAD_DEFAULT_STREAM, cache
    # the resulting PTDS flag in __usePTDS and mark the module initialised.
    # Returns the cached flag (0 or 1); -1 is reserved for a raised exception.
    global __cudaPythonInit
    global __usePTDS

    # os.getenv is a Python call, so the GIL must be held around it.
    with gil:
        # os.getenv returns a string and every non-empty string -- including
        # '0' -- is truthy, so coercing it straight to bint would enable PTDS
        # for CUDA_PYTHON_CUDA_PER_THREAD_DEFAULT_STREAM=0. Compare explicitly:
        # unset, empty and '0' disable PTDS; any other value enables it.
        __usePTDS = os.getenv('CUDA_PYTHON_CUDA_PER_THREAD_DEFAULT_STREAM', default='0') not in ('', '0')
    __cudaPythonInit = True
    return __usePTDS
# Create a very small function to check whether we are init'ed, so the C
# compiler can inline it.
cdef inline int cudaPythonInit() except -1 nogil:
    # First call falls through to _cudaPythonInit(); every later call just
    # hands back the cached PTDS flag.
    if not __cudaPythonInit:
        return _cudaPythonInit()
    return __usePTDS
cdef cudaError_t _cudaDeviceReset() except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceReset directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceReset()
    return ptds._cudaDeviceReset()
cdef cudaError_t _cudaDeviceSynchronize() except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceSynchronize directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceSynchronize()
    return ptds._cudaDeviceSynchronize()
cdef cudaError_t _cudaDeviceSetLimit(cudaLimit limit, size_t value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceSetLimit directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceSetLimit(limit, value)
    return ptds._cudaDeviceSetLimit(limit, value)
cdef cudaError_t _cudaDeviceGetLimit(size_t* pValue, cudaLimit limit) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetLimit directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetLimit(pValue, limit)
    return ptds._cudaDeviceGetLimit(pValue, limit)
cdef cudaError_t _cudaDeviceGetTexture1DLinearMaxWidth(size_t* maxWidthInElements, const cudaChannelFormatDesc* fmtDesc, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetTexture1DLinearMaxWidth directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetTexture1DLinearMaxWidth(maxWidthInElements, fmtDesc, device)
    return ptds._cudaDeviceGetTexture1DLinearMaxWidth(maxWidthInElements, fmtDesc, device)
cdef cudaError_t _cudaDeviceGetCacheConfig(cudaFuncCache* pCacheConfig) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetCacheConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetCacheConfig(pCacheConfig)
    return ptds._cudaDeviceGetCacheConfig(pCacheConfig)
cdef cudaError_t _cudaDeviceGetStreamPriorityRange(int* leastPriority, int* greatestPriority) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetStreamPriorityRange directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetStreamPriorityRange(leastPriority, greatestPriority)
    return ptds._cudaDeviceGetStreamPriorityRange(leastPriority, greatestPriority)
cdef cudaError_t _cudaDeviceSetCacheConfig(cudaFuncCache cacheConfig) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceSetCacheConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceSetCacheConfig(cacheConfig)
    return ptds._cudaDeviceSetCacheConfig(cacheConfig)
cdef cudaError_t _cudaDeviceGetByPCIBusId(int* device, const char* pciBusId) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetByPCIBusId directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetByPCIBusId(device, pciBusId)
    return ptds._cudaDeviceGetByPCIBusId(device, pciBusId)
cdef cudaError_t _cudaDeviceGetPCIBusId(char* pciBusId, int length, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetPCIBusId directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetPCIBusId(pciBusId, length, device)
    return ptds._cudaDeviceGetPCIBusId(pciBusId, length, device)
cdef cudaError_t _cudaIpcGetEventHandle(cudaIpcEventHandle_t* handle, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaIpcGetEventHandle directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaIpcGetEventHandle(handle, event)
    return ptds._cudaIpcGetEventHandle(handle, event)
cdef cudaError_t _cudaIpcOpenEventHandle(cudaEvent_t* event, cudaIpcEventHandle_t handle) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaIpcOpenEventHandle directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaIpcOpenEventHandle(event, handle)
    return ptds._cudaIpcOpenEventHandle(event, handle)
cdef cudaError_t _cudaIpcGetMemHandle(cudaIpcMemHandle_t* handle, void* devPtr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaIpcGetMemHandle directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaIpcGetMemHandle(handle, devPtr)
    return ptds._cudaIpcGetMemHandle(handle, devPtr)
cdef cudaError_t _cudaIpcOpenMemHandle(void** devPtr, cudaIpcMemHandle_t handle, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaIpcOpenMemHandle directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaIpcOpenMemHandle(devPtr, handle, flags)
    return ptds._cudaIpcOpenMemHandle(devPtr, handle, flags)
cdef cudaError_t _cudaIpcCloseMemHandle(void* devPtr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaIpcCloseMemHandle directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaIpcCloseMemHandle(devPtr)
    return ptds._cudaIpcCloseMemHandle(devPtr)
cdef cudaError_t _cudaDeviceFlushGPUDirectRDMAWrites(cudaFlushGPUDirectRDMAWritesTarget target, cudaFlushGPUDirectRDMAWritesScope scope) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceFlushGPUDirectRDMAWrites directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceFlushGPUDirectRDMAWrites(target, scope)
    return ptds._cudaDeviceFlushGPUDirectRDMAWrites(target, scope)
cdef cudaError_t _cudaDeviceRegisterAsyncNotification(int device, cudaAsyncCallback callbackFunc, void* userData, cudaAsyncCallbackHandle_t* callback) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceRegisterAsyncNotification directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceRegisterAsyncNotification(device, callbackFunc, userData, callback)
    return ptds._cudaDeviceRegisterAsyncNotification(device, callbackFunc, userData, callback)
cdef cudaError_t _cudaDeviceUnregisterAsyncNotification(int device, cudaAsyncCallbackHandle_t callback) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceUnregisterAsyncNotification directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceUnregisterAsyncNotification(device, callback)
    return ptds._cudaDeviceUnregisterAsyncNotification(device, callback)
cdef cudaError_t _cudaDeviceGetSharedMemConfig(cudaSharedMemConfig* pConfig) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetSharedMemConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetSharedMemConfig(pConfig)
    return ptds._cudaDeviceGetSharedMemConfig(pConfig)
cdef cudaError_t _cudaDeviceSetSharedMemConfig(cudaSharedMemConfig config) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceSetSharedMemConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceSetSharedMemConfig(config)
    return ptds._cudaDeviceSetSharedMemConfig(config)
cdef cudaError_t _cudaGetLastError() except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaGetLastError directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetLastError()
    return ptds._cudaGetLastError()
cdef cudaError_t _cudaPeekAtLastError() except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaPeekAtLastError directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaPeekAtLastError()
    return ptds._cudaPeekAtLastError()
cdef const char* _cudaGetErrorName(cudaError_t error) except ?NULL nogil:
    # Non-PTDS path calls cudaGetErrorName directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetErrorName(error)
    return ptds._cudaGetErrorName(error)
cdef const char* _cudaGetErrorString(cudaError_t error) except ?NULL nogil:
    # Non-PTDS path calls cudaGetErrorString directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetErrorString(error)
    return ptds._cudaGetErrorString(error)
cdef cudaError_t _cudaGetDeviceCount(int* count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaGetDeviceCount directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetDeviceCount(count)
    return ptds._cudaGetDeviceCount(count)
cdef cudaError_t _cudaGetDeviceProperties_v2(cudaDeviceProp* prop, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaGetDeviceProperties_v2 directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetDeviceProperties_v2(prop, device)
    return ptds._cudaGetDeviceProperties_v2(prop, device)
cdef cudaError_t _cudaDeviceGetAttribute(int* value, cudaDeviceAttr attr, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetAttribute directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetAttribute(value, attr, device)
    return ptds._cudaDeviceGetAttribute(value, attr, device)
cdef cudaError_t _cudaDeviceGetDefaultMemPool(cudaMemPool_t* memPool, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetDefaultMemPool directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetDefaultMemPool(memPool, device)
    return ptds._cudaDeviceGetDefaultMemPool(memPool, device)
cdef cudaError_t _cudaDeviceSetMemPool(int device, cudaMemPool_t memPool) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceSetMemPool directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceSetMemPool(device, memPool)
    return ptds._cudaDeviceSetMemPool(device, memPool)
cdef cudaError_t _cudaDeviceGetMemPool(cudaMemPool_t* memPool, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetMemPool directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetMemPool(memPool, device)
    return ptds._cudaDeviceGetMemPool(memPool, device)
cdef cudaError_t _cudaDeviceGetNvSciSyncAttributes(void* nvSciSyncAttrList, int device, int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetNvSciSyncAttributes directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetNvSciSyncAttributes(nvSciSyncAttrList, device, flags)
    return ptds._cudaDeviceGetNvSciSyncAttributes(nvSciSyncAttrList, device, flags)
cdef cudaError_t _cudaDeviceGetP2PAttribute(int* value, cudaDeviceP2PAttr attr, int srcDevice, int dstDevice) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDeviceGetP2PAttribute directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDeviceGetP2PAttribute(value, attr, srcDevice, dstDevice)
    return ptds._cudaDeviceGetP2PAttribute(value, attr, srcDevice, dstDevice)
cdef cudaError_t _cudaChooseDevice(int* device, const cudaDeviceProp* prop) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaChooseDevice directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaChooseDevice(device, prop)
    return ptds._cudaChooseDevice(device, prop)
cdef cudaError_t _cudaInitDevice(int device, unsigned int deviceFlags, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaInitDevice directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaInitDevice(device, deviceFlags, flags)
    return ptds._cudaInitDevice(device, deviceFlags, flags)
cdef cudaError_t _cudaSetDevice(int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaSetDevice directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaSetDevice(device)
    return ptds._cudaSetDevice(device)
cdef cudaError_t _cudaGetDevice(int* device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaGetDevice directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetDevice(device)
    return ptds._cudaGetDevice(device)
cdef cudaError_t _cudaSetDeviceFlags(unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaSetDeviceFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaSetDeviceFlags(flags)
    return ptds._cudaSetDeviceFlags(flags)
cdef cudaError_t _cudaGetDeviceFlags(unsigned int* flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaGetDeviceFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaGetDeviceFlags(flags)
    return ptds._cudaGetDeviceFlags(flags)
cdef cudaError_t _cudaStreamCreate(cudaStream_t* pStream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamCreate directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamCreate(pStream)
    return ptds._cudaStreamCreate(pStream)
cdef cudaError_t _cudaStreamCreateWithFlags(cudaStream_t* pStream, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamCreateWithFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamCreateWithFlags(pStream, flags)
    return ptds._cudaStreamCreateWithFlags(pStream, flags)
cdef cudaError_t _cudaStreamCreateWithPriority(cudaStream_t* pStream, unsigned int flags, int priority) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamCreateWithPriority directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamCreateWithPriority(pStream, flags, priority)
    return ptds._cudaStreamCreateWithPriority(pStream, flags, priority)
cdef cudaError_t _cudaStreamGetPriority(cudaStream_t hStream, int* priority) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetPriority directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetPriority(hStream, priority)
    return ptds._cudaStreamGetPriority(hStream, priority)
cdef cudaError_t _cudaStreamGetFlags(cudaStream_t hStream, unsigned int* flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetFlags(hStream, flags)
    return ptds._cudaStreamGetFlags(hStream, flags)
cdef cudaError_t _cudaStreamGetId(cudaStream_t hStream, unsigned long long* streamId) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetId directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetId(hStream, streamId)
    return ptds._cudaStreamGetId(hStream, streamId)
cdef cudaError_t _cudaStreamGetDevice(cudaStream_t hStream, int* device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetDevice directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetDevice(hStream, device)
    return ptds._cudaStreamGetDevice(hStream, device)
cdef cudaError_t _cudaCtxResetPersistingL2Cache() except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaCtxResetPersistingL2Cache directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaCtxResetPersistingL2Cache()
    return ptds._cudaCtxResetPersistingL2Cache()
cdef cudaError_t _cudaStreamCopyAttributes(cudaStream_t dst, cudaStream_t src) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamCopyAttributes directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamCopyAttributes(dst, src)
    return ptds._cudaStreamCopyAttributes(dst, src)
cdef cudaError_t _cudaStreamGetAttribute(cudaStream_t hStream, cudaStreamAttrID attr, cudaStreamAttrValue* value_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetAttribute directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetAttribute(hStream, attr, value_out)
    return ptds._cudaStreamGetAttribute(hStream, attr, value_out)
cdef cudaError_t _cudaStreamSetAttribute(cudaStream_t hStream, cudaStreamAttrID attr, const cudaStreamAttrValue* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamSetAttribute directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamSetAttribute(hStream, attr, value)
    return ptds._cudaStreamSetAttribute(hStream, attr, value)
cdef cudaError_t _cudaStreamDestroy(cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamDestroy directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamDestroy(stream)
    return ptds._cudaStreamDestroy(stream)
cdef cudaError_t _cudaStreamWaitEvent(cudaStream_t stream, cudaEvent_t event, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamWaitEvent directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamWaitEvent(stream, event, flags)
    return ptds._cudaStreamWaitEvent(stream, event, flags)
cdef cudaError_t _cudaStreamAddCallback(cudaStream_t stream, cudaStreamCallback_t callback, void* userData, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamAddCallback directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamAddCallback(stream, callback, userData, flags)
    return ptds._cudaStreamAddCallback(stream, callback, userData, flags)
cdef cudaError_t _cudaStreamSynchronize(cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamSynchronize directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamSynchronize(stream)
    return ptds._cudaStreamSynchronize(stream)
cdef cudaError_t _cudaStreamQuery(cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamQuery directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamQuery(stream)
    return ptds._cudaStreamQuery(stream)
cdef cudaError_t _cudaStreamAttachMemAsync(cudaStream_t stream, void* devPtr, size_t length, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamAttachMemAsync directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamAttachMemAsync(stream, devPtr, length, flags)
    return ptds._cudaStreamAttachMemAsync(stream, devPtr, length, flags)
cdef cudaError_t _cudaStreamBeginCapture(cudaStream_t stream, cudaStreamCaptureMode mode) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamBeginCapture directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamBeginCapture(stream, mode)
    return ptds._cudaStreamBeginCapture(stream, mode)
cdef cudaError_t _cudaStreamBeginCaptureToGraph(cudaStream_t stream, cudaGraph_t graph, const cudaGraphNode_t* dependencies, const cudaGraphEdgeData* dependencyData, size_t numDependencies, cudaStreamCaptureMode mode) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamBeginCaptureToGraph directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamBeginCaptureToGraph(stream, graph, dependencies, dependencyData, numDependencies, mode)
    return ptds._cudaStreamBeginCaptureToGraph(stream, graph, dependencies, dependencyData, numDependencies, mode)
cdef cudaError_t _cudaThreadExchangeStreamCaptureMode(cudaStreamCaptureMode* mode) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaThreadExchangeStreamCaptureMode directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaThreadExchangeStreamCaptureMode(mode)
    return ptds._cudaThreadExchangeStreamCaptureMode(mode)
cdef cudaError_t _cudaStreamEndCapture(cudaStream_t stream, cudaGraph_t* pGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamEndCapture directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamEndCapture(stream, pGraph)
    return ptds._cudaStreamEndCapture(stream, pGraph)
cdef cudaError_t _cudaStreamIsCapturing(cudaStream_t stream, cudaStreamCaptureStatus* pCaptureStatus) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamIsCapturing directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamIsCapturing(stream, pCaptureStatus)
    return ptds._cudaStreamIsCapturing(stream, pCaptureStatus)
cdef cudaError_t _cudaStreamGetCaptureInfo_v2(cudaStream_t stream, cudaStreamCaptureStatus* captureStatus_out, unsigned long long* id_out, cudaGraph_t* graph_out, const cudaGraphNode_t** dependencies_out, size_t* numDependencies_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetCaptureInfo_v2 directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetCaptureInfo_v2(stream, captureStatus_out, id_out, graph_out, dependencies_out, numDependencies_out)
    return ptds._cudaStreamGetCaptureInfo_v2(stream, captureStatus_out, id_out, graph_out, dependencies_out, numDependencies_out)
cdef cudaError_t _cudaStreamGetCaptureInfo_v3(cudaStream_t stream, cudaStreamCaptureStatus* captureStatus_out, unsigned long long* id_out, cudaGraph_t* graph_out, const cudaGraphNode_t** dependencies_out, const cudaGraphEdgeData** edgeData_out, size_t* numDependencies_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamGetCaptureInfo_v3 directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamGetCaptureInfo_v3(stream, captureStatus_out, id_out, graph_out, dependencies_out, edgeData_out, numDependencies_out)
    return ptds._cudaStreamGetCaptureInfo_v3(stream, captureStatus_out, id_out, graph_out, dependencies_out, edgeData_out, numDependencies_out)
cdef cudaError_t _cudaStreamUpdateCaptureDependencies(cudaStream_t stream, cudaGraphNode_t* dependencies, size_t numDependencies, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamUpdateCaptureDependencies directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamUpdateCaptureDependencies(stream, dependencies, numDependencies, flags)
    return ptds._cudaStreamUpdateCaptureDependencies(stream, dependencies, numDependencies, flags)
cdef cudaError_t _cudaStreamUpdateCaptureDependencies_v2(cudaStream_t stream, cudaGraphNode_t* dependencies, const cudaGraphEdgeData* dependencyData, size_t numDependencies, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaStreamUpdateCaptureDependencies_v2 directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaStreamUpdateCaptureDependencies_v2(stream, dependencies, dependencyData, numDependencies, flags)
    return ptds._cudaStreamUpdateCaptureDependencies_v2(stream, dependencies, dependencyData, numDependencies, flags)
cdef cudaError_t _cudaEventCreate(cudaEvent_t* event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventCreate directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventCreate(event)
    return ptds._cudaEventCreate(event)
cdef cudaError_t _cudaEventCreateWithFlags(cudaEvent_t* event, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventCreateWithFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventCreateWithFlags(event, flags)
    return ptds._cudaEventCreateWithFlags(event, flags)
cdef cudaError_t _cudaEventRecord(cudaEvent_t event, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventRecord directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventRecord(event, stream)
    return ptds._cudaEventRecord(event, stream)
cdef cudaError_t _cudaEventRecordWithFlags(cudaEvent_t event, cudaStream_t stream, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventRecordWithFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventRecordWithFlags(event, stream, flags)
    return ptds._cudaEventRecordWithFlags(event, stream, flags)
cdef cudaError_t _cudaEventQuery(cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventQuery directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventQuery(event)
    return ptds._cudaEventQuery(event)
cdef cudaError_t _cudaEventSynchronize(cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventSynchronize directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventSynchronize(event)
    return ptds._cudaEventSynchronize(event)
cdef cudaError_t _cudaEventDestroy(cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventDestroy directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventDestroy(event)
    return ptds._cudaEventDestroy(event)
cdef cudaError_t _cudaEventElapsedTime(float* ms, cudaEvent_t start, cudaEvent_t end) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventElapsedTime directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventElapsedTime(ms, start, end)
    return ptds._cudaEventElapsedTime(ms, start, end)
cdef cudaError_t _cudaEventElapsedTime_v2(float* ms, cudaEvent_t start, cudaEvent_t end) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaEventElapsedTime_v2 directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaEventElapsedTime_v2(ms, start, end)
    return ptds._cudaEventElapsedTime_v2(ms, start, end)
cdef cudaError_t _cudaImportExternalMemory(cudaExternalMemory_t* extMem_out, const cudaExternalMemoryHandleDesc* memHandleDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaImportExternalMemory directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaImportExternalMemory(extMem_out, memHandleDesc)
    return ptds._cudaImportExternalMemory(extMem_out, memHandleDesc)
cdef cudaError_t _cudaExternalMemoryGetMappedBuffer(void** devPtr, cudaExternalMemory_t extMem, const cudaExternalMemoryBufferDesc* bufferDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaExternalMemoryGetMappedBuffer directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaExternalMemoryGetMappedBuffer(devPtr, extMem, bufferDesc)
    return ptds._cudaExternalMemoryGetMappedBuffer(devPtr, extMem, bufferDesc)
cdef cudaError_t _cudaExternalMemoryGetMappedMipmappedArray(cudaMipmappedArray_t* mipmap, cudaExternalMemory_t extMem, const cudaExternalMemoryMipmappedArrayDesc* mipmapDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaExternalMemoryGetMappedMipmappedArray directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaExternalMemoryGetMappedMipmappedArray(mipmap, extMem, mipmapDesc)
    return ptds._cudaExternalMemoryGetMappedMipmappedArray(mipmap, extMem, mipmapDesc)
cdef cudaError_t _cudaDestroyExternalMemory(cudaExternalMemory_t extMem) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDestroyExternalMemory directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDestroyExternalMemory(extMem)
    return ptds._cudaDestroyExternalMemory(extMem)
cdef cudaError_t _cudaImportExternalSemaphore(cudaExternalSemaphore_t* extSem_out, const cudaExternalSemaphoreHandleDesc* semHandleDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaImportExternalSemaphore directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaImportExternalSemaphore(extSem_out, semHandleDesc)
    return ptds._cudaImportExternalSemaphore(extSem_out, semHandleDesc)
cdef cudaError_t _cudaSignalExternalSemaphoresAsync_v2(const cudaExternalSemaphore_t* extSemArray, const cudaExternalSemaphoreSignalParams* paramsArray, unsigned int numExtSems, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaSignalExternalSemaphoresAsync_v2 directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaSignalExternalSemaphoresAsync_v2(extSemArray, paramsArray, numExtSems, stream)
    return ptds._cudaSignalExternalSemaphoresAsync_v2(extSemArray, paramsArray, numExtSems, stream)
cdef cudaError_t _cudaWaitExternalSemaphoresAsync_v2(const cudaExternalSemaphore_t* extSemArray, const cudaExternalSemaphoreWaitParams* paramsArray, unsigned int numExtSems, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaWaitExternalSemaphoresAsync_v2 directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaWaitExternalSemaphoresAsync_v2(extSemArray, paramsArray, numExtSems, stream)
    return ptds._cudaWaitExternalSemaphoresAsync_v2(extSemArray, paramsArray, numExtSems, stream)
cdef cudaError_t _cudaDestroyExternalSemaphore(cudaExternalSemaphore_t extSem) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaDestroyExternalSemaphore directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaDestroyExternalSemaphore(extSem)
    return ptds._cudaDestroyExternalSemaphore(extSem)
cdef cudaError_t _cudaFuncSetCacheConfig(const void* func, cudaFuncCache cacheConfig) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFuncSetCacheConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFuncSetCacheConfig(func, cacheConfig)
    return ptds._cudaFuncSetCacheConfig(func, cacheConfig)
cdef cudaError_t _cudaFuncGetAttributes(cudaFuncAttributes* attr, const void* func) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFuncGetAttributes directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFuncGetAttributes(attr, func)
    return ptds._cudaFuncGetAttributes(attr, func)
cdef cudaError_t _cudaFuncSetAttribute(const void* func, cudaFuncAttribute attr, int value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFuncSetAttribute directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFuncSetAttribute(func, attr, value)
    return ptds._cudaFuncSetAttribute(func, attr, value)
cdef cudaError_t _cudaLaunchHostFunc(cudaStream_t stream, cudaHostFn_t fn, void* userData) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaLaunchHostFunc directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaLaunchHostFunc(stream, fn, userData)
    return ptds._cudaLaunchHostFunc(stream, fn, userData)
cdef cudaError_t _cudaFuncSetSharedMemConfig(const void* func, cudaSharedMemConfig config) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFuncSetSharedMemConfig directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFuncSetSharedMemConfig(func, config)
    return ptds._cudaFuncSetSharedMemConfig(func, config)
cdef cudaError_t _cudaOccupancyMaxActiveBlocksPerMultiprocessor(int* numBlocks, const void* func, int blockSize, size_t dynamicSMemSize) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaOccupancyMaxActiveBlocksPerMultiprocessor directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaOccupancyMaxActiveBlocksPerMultiprocessor(numBlocks, func, blockSize, dynamicSMemSize)
    return ptds._cudaOccupancyMaxActiveBlocksPerMultiprocessor(numBlocks, func, blockSize, dynamicSMemSize)
cdef cudaError_t _cudaOccupancyAvailableDynamicSMemPerBlock(size_t* dynamicSmemSize, const void* func, int numBlocks, int blockSize) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaOccupancyAvailableDynamicSMemPerBlock directly;
    # otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaOccupancyAvailableDynamicSMemPerBlock(dynamicSmemSize, func, numBlocks, blockSize)
    return ptds._cudaOccupancyAvailableDynamicSMemPerBlock(dynamicSmemSize, func, numBlocks, blockSize)
cdef cudaError_t _cudaOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(int* numBlocks, const void* func, int blockSize, size_t dynamicSMemSize, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaOccupancyMaxActiveBlocksPerMultiprocessorWithFlags
    # directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(numBlocks, func, blockSize, dynamicSMemSize, flags)
    return ptds._cudaOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(numBlocks, func, blockSize, dynamicSMemSize, flags)
cdef cudaError_t _cudaMallocManaged(void** devPtr, size_t size, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMallocManaged directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMallocManaged(devPtr, size, flags)
    return ptds._cudaMallocManaged(devPtr, size, flags)
cdef cudaError_t _cudaMalloc(void** devPtr, size_t size) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMalloc directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMalloc(devPtr, size)
    return ptds._cudaMalloc(devPtr, size)
cdef cudaError_t _cudaMallocHost(void** ptr, size_t size) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMallocHost directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMallocHost(ptr, size)
    return ptds._cudaMallocHost(ptr, size)
cdef cudaError_t _cudaMallocPitch(void** devPtr, size_t* pitch, size_t width, size_t height) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMallocPitch directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMallocPitch(devPtr, pitch, width, height)
    return ptds._cudaMallocPitch(devPtr, pitch, width, height)
cdef cudaError_t _cudaMallocArray(cudaArray_t* array, const cudaChannelFormatDesc* desc, size_t width, size_t height, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMallocArray directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMallocArray(array, desc, width, height, flags)
    return ptds._cudaMallocArray(array, desc, width, height, flags)
cdef cudaError_t _cudaFree(void* devPtr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFree directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFree(devPtr)
    return ptds._cudaFree(devPtr)
cdef cudaError_t _cudaFreeHost(void* ptr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFreeHost directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFreeHost(ptr)
    return ptds._cudaFreeHost(ptr)
cdef cudaError_t _cudaFreeArray(cudaArray_t array) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFreeArray directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFreeArray(array)
    return ptds._cudaFreeArray(array)
cdef cudaError_t _cudaFreeMipmappedArray(cudaMipmappedArray_t mipmappedArray) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaFreeMipmappedArray directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaFreeMipmappedArray(mipmappedArray)
    return ptds._cudaFreeMipmappedArray(mipmappedArray)
cdef cudaError_t _cudaHostAlloc(void** pHost, size_t size, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaHostAlloc directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaHostAlloc(pHost, size, flags)
    return ptds._cudaHostAlloc(pHost, size, flags)
cdef cudaError_t _cudaHostRegister(void* ptr, size_t size, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaHostRegister directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaHostRegister(ptr, size, flags)
    return ptds._cudaHostRegister(ptr, size, flags)
cdef cudaError_t _cudaHostUnregister(void* ptr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaHostUnregister directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaHostUnregister(ptr)
    return ptds._cudaHostUnregister(ptr)
cdef cudaError_t _cudaHostGetDevicePointer(void** pDevice, void* pHost, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaHostGetDevicePointer directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaHostGetDevicePointer(pDevice, pHost, flags)
    return ptds._cudaHostGetDevicePointer(pDevice, pHost, flags)
cdef cudaError_t _cudaHostGetFlags(unsigned int* pFlags, void* pHost) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaHostGetFlags directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaHostGetFlags(pFlags, pHost)
    return ptds._cudaHostGetFlags(pFlags, pHost)
cdef cudaError_t _cudaMalloc3D(cudaPitchedPtr* pitchedDevPtr, cudaExtent extent) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMalloc3D directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMalloc3D(pitchedDevPtr, extent)
    return ptds._cudaMalloc3D(pitchedDevPtr, extent)
cdef cudaError_t _cudaMalloc3DArray(cudaArray_t* array, const cudaChannelFormatDesc* desc, cudaExtent extent, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Non-PTDS path calls cudaMalloc3DArray directly; otherwise delegate to ptds.
    if not cudaPythonInit():
        return cudaMalloc3DArray(array, desc, extent, flags)
    return ptds._cudaMalloc3DArray(array, desc, extent, flags)
cdef cudaError_t _cudaMallocMipmappedArray(cudaMipmappedArray_t* mipmappedArray, const cudaChannelFormatDesc* desc, cudaExtent extent, unsigned int numLevels, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMallocMipmappedArray directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMallocMipmappedArray(mipmappedArray, desc, extent, numLevels, flags)
    return ptds._cudaMallocMipmappedArray(mipmappedArray, desc, extent, numLevels, flags)
cdef cudaError_t _cudaGetMipmappedArrayLevel(cudaArray_t* levelArray, cudaMipmappedArray_const_t mipmappedArray, unsigned int level) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetMipmappedArrayLevel directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGetMipmappedArrayLevel(levelArray, mipmappedArray, level)
    return ptds._cudaGetMipmappedArrayLevel(levelArray, mipmappedArray, level)
cdef cudaError_t _cudaMemcpy3D(const cudaMemcpy3DParms* p) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy3D directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy3D(p)
    return ptds._cudaMemcpy3D(p)
cdef cudaError_t _cudaMemcpy3DPeer(const cudaMemcpy3DPeerParms* p) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy3DPeer directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy3DPeer(p)
    return ptds._cudaMemcpy3DPeer(p)
cdef cudaError_t _cudaMemcpy3DAsync(const cudaMemcpy3DParms* p, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy3DAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy3DAsync(p, stream)
    return ptds._cudaMemcpy3DAsync(p, stream)
cdef cudaError_t _cudaMemcpy3DPeerAsync(const cudaMemcpy3DPeerParms* p, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy3DPeerAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy3DPeerAsync(p, stream)
    return ptds._cudaMemcpy3DPeerAsync(p, stream)
cdef cudaError_t _cudaMemGetInfo(size_t* free, size_t* total) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemGetInfo directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemGetInfo(free, total)
    return ptds._cudaMemGetInfo(free, total)
cdef cudaError_t _cudaArrayGetInfo(cudaChannelFormatDesc* desc, cudaExtent* extent, unsigned int* flags, cudaArray_t array) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaArrayGetInfo directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaArrayGetInfo(desc, extent, flags, array)
    return ptds._cudaArrayGetInfo(desc, extent, flags, array)
cdef cudaError_t _cudaArrayGetPlane(cudaArray_t* pPlaneArray, cudaArray_t hArray, unsigned int planeIdx) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaArrayGetPlane directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaArrayGetPlane(pPlaneArray, hArray, planeIdx)
    return ptds._cudaArrayGetPlane(pPlaneArray, hArray, planeIdx)
cdef cudaError_t _cudaArrayGetMemoryRequirements(cudaArrayMemoryRequirements* memoryRequirements, cudaArray_t array, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaArrayGetMemoryRequirements directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaArrayGetMemoryRequirements(memoryRequirements, array, device)
    return ptds._cudaArrayGetMemoryRequirements(memoryRequirements, array, device)
cdef cudaError_t _cudaMipmappedArrayGetMemoryRequirements(cudaArrayMemoryRequirements* memoryRequirements, cudaMipmappedArray_t mipmap, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMipmappedArrayGetMemoryRequirements directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaMipmappedArrayGetMemoryRequirements(memoryRequirements, mipmap, device)
    return ptds._cudaMipmappedArrayGetMemoryRequirements(memoryRequirements, mipmap, device)
cdef cudaError_t _cudaArrayGetSparseProperties(cudaArraySparseProperties* sparseProperties, cudaArray_t array) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaArrayGetSparseProperties directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaArrayGetSparseProperties(sparseProperties, array)
    return ptds._cudaArrayGetSparseProperties(sparseProperties, array)
cdef cudaError_t _cudaMipmappedArrayGetSparseProperties(cudaArraySparseProperties* sparseProperties, cudaMipmappedArray_t mipmap) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMipmappedArrayGetSparseProperties directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaMipmappedArrayGetSparseProperties(sparseProperties, mipmap)
    return ptds._cudaMipmappedArrayGetSparseProperties(sparseProperties, mipmap)
cdef cudaError_t _cudaMemcpy(void* dst, const void* src, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy(dst, src, count, kind)
    return ptds._cudaMemcpy(dst, src, count, kind)
cdef cudaError_t _cudaMemcpyPeer(void* dst, int dstDevice, const void* src, int srcDevice, size_t count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyPeer directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyPeer(dst, dstDevice, src, srcDevice, count)
    return ptds._cudaMemcpyPeer(dst, dstDevice, src, srcDevice, count)
cdef cudaError_t _cudaMemcpy2D(void* dst, size_t dpitch, const void* src, size_t spitch, size_t width, size_t height, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2D directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2D(dst, dpitch, src, spitch, width, height, kind)
    return ptds._cudaMemcpy2D(dst, dpitch, src, spitch, width, height, kind)
cdef cudaError_t _cudaMemcpy2DToArray(cudaArray_t dst, size_t wOffset, size_t hOffset, const void* src, size_t spitch, size_t width, size_t height, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DToArray directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DToArray(dst, wOffset, hOffset, src, spitch, width, height, kind)
    return ptds._cudaMemcpy2DToArray(dst, wOffset, hOffset, src, spitch, width, height, kind)
cdef cudaError_t _cudaMemcpy2DFromArray(void* dst, size_t dpitch, cudaArray_const_t src, size_t wOffset, size_t hOffset, size_t width, size_t height, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DFromArray directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DFromArray(dst, dpitch, src, wOffset, hOffset, width, height, kind)
    return ptds._cudaMemcpy2DFromArray(dst, dpitch, src, wOffset, hOffset, width, height, kind)
cdef cudaError_t _cudaMemcpy2DArrayToArray(cudaArray_t dst, size_t wOffsetDst, size_t hOffsetDst, cudaArray_const_t src, size_t wOffsetSrc, size_t hOffsetSrc, size_t width, size_t height, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DArrayToArray directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DArrayToArray(dst, wOffsetDst, hOffsetDst, src, wOffsetSrc, hOffsetSrc, width, height, kind)
    return ptds._cudaMemcpy2DArrayToArray(dst, wOffsetDst, hOffsetDst, src, wOffsetSrc, hOffsetSrc, width, height, kind)
cdef cudaError_t _cudaMemcpyAsync(void* dst, const void* src, size_t count, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyAsync(dst, src, count, kind, stream)
    return ptds._cudaMemcpyAsync(dst, src, count, kind, stream)
cdef cudaError_t _cudaMemcpyPeerAsync(void* dst, int dstDevice, const void* src, int srcDevice, size_t count, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyPeerAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyPeerAsync(dst, dstDevice, src, srcDevice, count, stream)
    return ptds._cudaMemcpyPeerAsync(dst, dstDevice, src, srcDevice, count, stream)
cdef cudaError_t _cudaMemcpyBatchAsync(void** dsts, void** srcs, size_t* sizes, size_t count, cudaMemcpyAttributes* attrs, size_t* attrsIdxs, size_t numAttrs, size_t* failIdx, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyBatchAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyBatchAsync(dsts, srcs, sizes, count, attrs, attrsIdxs, numAttrs, failIdx, stream)
    return ptds._cudaMemcpyBatchAsync(dsts, srcs, sizes, count, attrs, attrsIdxs, numAttrs, failIdx, stream)
cdef cudaError_t _cudaMemcpy3DBatchAsync(size_t numOps, cudaMemcpy3DBatchOp* opList, size_t* failIdx, unsigned long long flags, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy3DBatchAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy3DBatchAsync(numOps, opList, failIdx, flags, stream)
    return ptds._cudaMemcpy3DBatchAsync(numOps, opList, failIdx, flags, stream)
cdef cudaError_t _cudaMemcpy2DAsync(void* dst, size_t dpitch, const void* src, size_t spitch, size_t width, size_t height, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DAsync(dst, dpitch, src, spitch, width, height, kind, stream)
    return ptds._cudaMemcpy2DAsync(dst, dpitch, src, spitch, width, height, kind, stream)
cdef cudaError_t _cudaMemcpy2DToArrayAsync(cudaArray_t dst, size_t wOffset, size_t hOffset, const void* src, size_t spitch, size_t width, size_t height, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DToArrayAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DToArrayAsync(dst, wOffset, hOffset, src, spitch, width, height, kind, stream)
    return ptds._cudaMemcpy2DToArrayAsync(dst, wOffset, hOffset, src, spitch, width, height, kind, stream)
cdef cudaError_t _cudaMemcpy2DFromArrayAsync(void* dst, size_t dpitch, cudaArray_const_t src, size_t wOffset, size_t hOffset, size_t width, size_t height, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpy2DFromArrayAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpy2DFromArrayAsync(dst, dpitch, src, wOffset, hOffset, width, height, kind, stream)
    return ptds._cudaMemcpy2DFromArrayAsync(dst, dpitch, src, wOffset, hOffset, width, height, kind, stream)
cdef cudaError_t _cudaMemset(void* devPtr, int value, size_t count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemset directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemset(devPtr, value, count)
    return ptds._cudaMemset(devPtr, value, count)
cdef cudaError_t _cudaMemset2D(void* devPtr, size_t pitch, int value, size_t width, size_t height) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemset2D directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemset2D(devPtr, pitch, value, width, height)
    return ptds._cudaMemset2D(devPtr, pitch, value, width, height)
cdef cudaError_t _cudaMemset3D(cudaPitchedPtr pitchedDevPtr, int value, cudaExtent extent) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemset3D directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemset3D(pitchedDevPtr, value, extent)
    return ptds._cudaMemset3D(pitchedDevPtr, value, extent)
cdef cudaError_t _cudaMemsetAsync(void* devPtr, int value, size_t count, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemsetAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemsetAsync(devPtr, value, count, stream)
    return ptds._cudaMemsetAsync(devPtr, value, count, stream)
cdef cudaError_t _cudaMemset2DAsync(void* devPtr, size_t pitch, int value, size_t width, size_t height, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemset2DAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemset2DAsync(devPtr, pitch, value, width, height, stream)
    return ptds._cudaMemset2DAsync(devPtr, pitch, value, width, height, stream)
cdef cudaError_t _cudaMemset3DAsync(cudaPitchedPtr pitchedDevPtr, int value, cudaExtent extent, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemset3DAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemset3DAsync(pitchedDevPtr, value, extent, stream)
    return ptds._cudaMemset3DAsync(pitchedDevPtr, value, extent, stream)
cdef cudaError_t _cudaMemPrefetchAsync(const void* devPtr, size_t count, int dstDevice, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPrefetchAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPrefetchAsync(devPtr, count, dstDevice, stream)
    return ptds._cudaMemPrefetchAsync(devPtr, count, dstDevice, stream)
cdef cudaError_t _cudaMemPrefetchAsync_v2(const void* devPtr, size_t count, cudaMemLocation location, unsigned int flags, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPrefetchAsync_v2 directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPrefetchAsync_v2(devPtr, count, location, flags, stream)
    return ptds._cudaMemPrefetchAsync_v2(devPtr, count, location, flags, stream)
cdef cudaError_t _cudaMemAdvise(const void* devPtr, size_t count, cudaMemoryAdvise advice, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemAdvise directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemAdvise(devPtr, count, advice, device)
    return ptds._cudaMemAdvise(devPtr, count, advice, device)
cdef cudaError_t _cudaMemAdvise_v2(const void* devPtr, size_t count, cudaMemoryAdvise advice, cudaMemLocation location) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemAdvise_v2 directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemAdvise_v2(devPtr, count, advice, location)
    return ptds._cudaMemAdvise_v2(devPtr, count, advice, location)
cdef cudaError_t _cudaMemRangeGetAttribute(void* data, size_t dataSize, cudaMemRangeAttribute attribute, const void* devPtr, size_t count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemRangeGetAttribute directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemRangeGetAttribute(data, dataSize, attribute, devPtr, count)
    return ptds._cudaMemRangeGetAttribute(data, dataSize, attribute, devPtr, count)
cdef cudaError_t _cudaMemRangeGetAttributes(void** data, size_t* dataSizes, cudaMemRangeAttribute* attributes, size_t numAttributes, const void* devPtr, size_t count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemRangeGetAttributes directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemRangeGetAttributes(data, dataSizes, attributes, numAttributes, devPtr, count)
    return ptds._cudaMemRangeGetAttributes(data, dataSizes, attributes, numAttributes, devPtr, count)
cdef cudaError_t _cudaMemcpyToArray(cudaArray_t dst, size_t wOffset, size_t hOffset, const void* src, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyToArray directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyToArray(dst, wOffset, hOffset, src, count, kind)
    return ptds._cudaMemcpyToArray(dst, wOffset, hOffset, src, count, kind)
cdef cudaError_t _cudaMemcpyFromArray(void* dst, cudaArray_const_t src, size_t wOffset, size_t hOffset, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyFromArray directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyFromArray(dst, src, wOffset, hOffset, count, kind)
    return ptds._cudaMemcpyFromArray(dst, src, wOffset, hOffset, count, kind)
cdef cudaError_t _cudaMemcpyArrayToArray(cudaArray_t dst, size_t wOffsetDst, size_t hOffsetDst, cudaArray_const_t src, size_t wOffsetSrc, size_t hOffsetSrc, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyArrayToArray directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyArrayToArray(dst, wOffsetDst, hOffsetDst, src, wOffsetSrc, hOffsetSrc, count, kind)
    return ptds._cudaMemcpyArrayToArray(dst, wOffsetDst, hOffsetDst, src, wOffsetSrc, hOffsetSrc, count, kind)
cdef cudaError_t _cudaMemcpyToArrayAsync(cudaArray_t dst, size_t wOffset, size_t hOffset, const void* src, size_t count, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyToArrayAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyToArrayAsync(dst, wOffset, hOffset, src, count, kind, stream)
    return ptds._cudaMemcpyToArrayAsync(dst, wOffset, hOffset, src, count, kind, stream)
cdef cudaError_t _cudaMemcpyFromArrayAsync(void* dst, cudaArray_const_t src, size_t wOffset, size_t hOffset, size_t count, cudaMemcpyKind kind, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemcpyFromArrayAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemcpyFromArrayAsync(dst, src, wOffset, hOffset, count, kind, stream)
    return ptds._cudaMemcpyFromArrayAsync(dst, src, wOffset, hOffset, count, kind, stream)
cdef cudaError_t _cudaMallocAsync(void** devPtr, size_t size, cudaStream_t hStream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMallocAsync directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMallocAsync(devPtr, size, hStream)
    return ptds._cudaMallocAsync(devPtr, size, hStream)
cdef cudaError_t _cudaFreeAsync(void* devPtr, cudaStream_t hStream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaFreeAsync directly unless cudaPythonInit() reports PTDS mode,
    # in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaFreeAsync(devPtr, hStream)
    return ptds._cudaFreeAsync(devPtr, hStream)
cdef cudaError_t _cudaMemPoolTrimTo(cudaMemPool_t memPool, size_t minBytesToKeep) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolTrimTo directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolTrimTo(memPool, minBytesToKeep)
    return ptds._cudaMemPoolTrimTo(memPool, minBytesToKeep)
cdef cudaError_t _cudaMemPoolSetAttribute(cudaMemPool_t memPool, cudaMemPoolAttr attr, void* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolSetAttribute directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolSetAttribute(memPool, attr, value)
    return ptds._cudaMemPoolSetAttribute(memPool, attr, value)
cdef cudaError_t _cudaMemPoolGetAttribute(cudaMemPool_t memPool, cudaMemPoolAttr attr, void* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolGetAttribute directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolGetAttribute(memPool, attr, value)
    return ptds._cudaMemPoolGetAttribute(memPool, attr, value)
cdef cudaError_t _cudaMemPoolSetAccess(cudaMemPool_t memPool, const cudaMemAccessDesc* descList, size_t count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolSetAccess directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolSetAccess(memPool, descList, count)
    return ptds._cudaMemPoolSetAccess(memPool, descList, count)
cdef cudaError_t _cudaMemPoolGetAccess(cudaMemAccessFlags* flags, cudaMemPool_t memPool, cudaMemLocation* location) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolGetAccess directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolGetAccess(flags, memPool, location)
    return ptds._cudaMemPoolGetAccess(flags, memPool, location)
cdef cudaError_t _cudaMemPoolCreate(cudaMemPool_t* memPool, const cudaMemPoolProps* poolProps) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolCreate directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolCreate(memPool, poolProps)
    return ptds._cudaMemPoolCreate(memPool, poolProps)
cdef cudaError_t _cudaMemPoolDestroy(cudaMemPool_t memPool) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolDestroy directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolDestroy(memPool)
    return ptds._cudaMemPoolDestroy(memPool)
cdef cudaError_t _cudaMallocFromPoolAsync(void** ptr, size_t size, cudaMemPool_t memPool, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMallocFromPoolAsync directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMallocFromPoolAsync(ptr, size, memPool, stream)
    return ptds._cudaMallocFromPoolAsync(ptr, size, memPool, stream)
cdef cudaError_t _cudaMemPoolExportToShareableHandle(void* shareableHandle, cudaMemPool_t memPool, cudaMemAllocationHandleType handleType, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolExportToShareableHandle directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolExportToShareableHandle(shareableHandle, memPool, handleType, flags)
    return ptds._cudaMemPoolExportToShareableHandle(shareableHandle, memPool, handleType, flags)
cdef cudaError_t _cudaMemPoolImportFromShareableHandle(cudaMemPool_t* memPool, void* shareableHandle, cudaMemAllocationHandleType handleType, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolImportFromShareableHandle directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaMemPoolImportFromShareableHandle(memPool, shareableHandle, handleType, flags)
    return ptds._cudaMemPoolImportFromShareableHandle(memPool, shareableHandle, handleType, flags)
cdef cudaError_t _cudaMemPoolExportPointer(cudaMemPoolPtrExportData* exportData, void* ptr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolExportPointer directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolExportPointer(exportData, ptr)
    return ptds._cudaMemPoolExportPointer(exportData, ptr)
cdef cudaError_t _cudaMemPoolImportPointer(void** ptr, cudaMemPool_t memPool, cudaMemPoolPtrExportData* exportData) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaMemPoolImportPointer directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaMemPoolImportPointer(ptr, memPool, exportData)
    return ptds._cudaMemPoolImportPointer(ptr, memPool, exportData)
cdef cudaError_t _cudaPointerGetAttributes(cudaPointerAttributes* attributes, const void* ptr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaPointerGetAttributes directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaPointerGetAttributes(attributes, ptr)
    return ptds._cudaPointerGetAttributes(attributes, ptr)
cdef cudaError_t _cudaDeviceCanAccessPeer(int* canAccessPeer, int device, int peerDevice) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDeviceCanAccessPeer directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaDeviceCanAccessPeer(canAccessPeer, device, peerDevice)
    return ptds._cudaDeviceCanAccessPeer(canAccessPeer, device, peerDevice)
cdef cudaError_t _cudaDeviceEnablePeerAccess(int peerDevice, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDeviceEnablePeerAccess directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaDeviceEnablePeerAccess(peerDevice, flags)
    return ptds._cudaDeviceEnablePeerAccess(peerDevice, flags)
cdef cudaError_t _cudaDeviceDisablePeerAccess(int peerDevice) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDeviceDisablePeerAccess directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaDeviceDisablePeerAccess(peerDevice)
    return ptds._cudaDeviceDisablePeerAccess(peerDevice)
cdef cudaError_t _cudaGraphicsUnregisterResource(cudaGraphicsResource_t resource) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsUnregisterResource directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphicsUnregisterResource(resource)
    return ptds._cudaGraphicsUnregisterResource(resource)
cdef cudaError_t _cudaGraphicsResourceSetMapFlags(cudaGraphicsResource_t resource, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsResourceSetMapFlags directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphicsResourceSetMapFlags(resource, flags)
    return ptds._cudaGraphicsResourceSetMapFlags(resource, flags)
cdef cudaError_t _cudaGraphicsMapResources(int count, cudaGraphicsResource_t* resources, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsMapResources directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphicsMapResources(count, resources, stream)
    return ptds._cudaGraphicsMapResources(count, resources, stream)
cdef cudaError_t _cudaGraphicsUnmapResources(int count, cudaGraphicsResource_t* resources, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsUnmapResources directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphicsUnmapResources(count, resources, stream)
    return ptds._cudaGraphicsUnmapResources(count, resources, stream)
cdef cudaError_t _cudaGraphicsResourceGetMappedPointer(void** devPtr, size_t* size, cudaGraphicsResource_t resource) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsResourceGetMappedPointer directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaGraphicsResourceGetMappedPointer(devPtr, size, resource)
    return ptds._cudaGraphicsResourceGetMappedPointer(devPtr, size, resource)
cdef cudaError_t _cudaGraphicsSubResourceGetMappedArray(cudaArray_t* array, cudaGraphicsResource_t resource, unsigned int arrayIndex, unsigned int mipLevel) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsSubResourceGetMappedArray directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaGraphicsSubResourceGetMappedArray(array, resource, arrayIndex, mipLevel)
    return ptds._cudaGraphicsSubResourceGetMappedArray(array, resource, arrayIndex, mipLevel)
cdef cudaError_t _cudaGraphicsResourceGetMappedMipmappedArray(cudaMipmappedArray_t* mipmappedArray, cudaGraphicsResource_t resource) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphicsResourceGetMappedMipmappedArray directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaGraphicsResourceGetMappedMipmappedArray(mipmappedArray, resource)
    return ptds._cudaGraphicsResourceGetMappedMipmappedArray(mipmappedArray, resource)
cdef cudaError_t _cudaGetChannelDesc(cudaChannelFormatDesc* desc, cudaArray_const_t array) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetChannelDesc directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGetChannelDesc(desc, array)
    return ptds._cudaGetChannelDesc(desc, array)
@cython.show_performance_hints(False)
cdef cudaChannelFormatDesc _cudaCreateChannelDesc(int x, int y, int z, int w, cudaChannelFormatKind f) except* nogil:
    # Unlike its siblings this wrapper returns a cudaChannelFormatDesc by
    # value rather than a cudaError_t, hence the `except*` declaration.
    # Call cudaCreateChannelDesc directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaCreateChannelDesc(x, y, z, w, f)
    return ptds._cudaCreateChannelDesc(x, y, z, w, f)
cdef cudaError_t _cudaCreateTextureObject(cudaTextureObject_t* pTexObject, const cudaResourceDesc* pResDesc, const cudaTextureDesc* pTexDesc, const cudaResourceViewDesc* pResViewDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaCreateTextureObject directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaCreateTextureObject(pTexObject, pResDesc, pTexDesc, pResViewDesc)
    return ptds._cudaCreateTextureObject(pTexObject, pResDesc, pTexDesc, pResViewDesc)
cdef cudaError_t _cudaDestroyTextureObject(cudaTextureObject_t texObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDestroyTextureObject directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaDestroyTextureObject(texObject)
    return ptds._cudaDestroyTextureObject(texObject)
cdef cudaError_t _cudaGetTextureObjectResourceDesc(cudaResourceDesc* pResDesc, cudaTextureObject_t texObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetTextureObjectResourceDesc directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGetTextureObjectResourceDesc(pResDesc, texObject)
    return ptds._cudaGetTextureObjectResourceDesc(pResDesc, texObject)
cdef cudaError_t _cudaGetTextureObjectTextureDesc(cudaTextureDesc* pTexDesc, cudaTextureObject_t texObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetTextureObjectTextureDesc directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGetTextureObjectTextureDesc(pTexDesc, texObject)
    return ptds._cudaGetTextureObjectTextureDesc(pTexDesc, texObject)
cdef cudaError_t _cudaGetTextureObjectResourceViewDesc(cudaResourceViewDesc* pResViewDesc, cudaTextureObject_t texObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetTextureObjectResourceViewDesc directly unless
    # cudaPythonInit() reports PTDS mode, in which case the `ptds` variant
    # handles the call.
    if not cudaPythonInit():
        return cudaGetTextureObjectResourceViewDesc(pResViewDesc, texObject)
    return ptds._cudaGetTextureObjectResourceViewDesc(pResViewDesc, texObject)
cdef cudaError_t _cudaCreateSurfaceObject(cudaSurfaceObject_t* pSurfObject, const cudaResourceDesc* pResDesc) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaCreateSurfaceObject directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaCreateSurfaceObject(pSurfObject, pResDesc)
    return ptds._cudaCreateSurfaceObject(pSurfObject, pResDesc)
cdef cudaError_t _cudaDestroySurfaceObject(cudaSurfaceObject_t surfObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDestroySurfaceObject directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaDestroySurfaceObject(surfObject)
    return ptds._cudaDestroySurfaceObject(surfObject)
cdef cudaError_t _cudaGetSurfaceObjectResourceDesc(cudaResourceDesc* pResDesc, cudaSurfaceObject_t surfObject) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGetSurfaceObjectResourceDesc directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGetSurfaceObjectResourceDesc(pResDesc, surfObject)
    return ptds._cudaGetSurfaceObjectResourceDesc(pResDesc, surfObject)
cdef cudaError_t _cudaDriverGetVersion(int* driverVersion) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaDriverGetVersion directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaDriverGetVersion(driverVersion)
    return ptds._cudaDriverGetVersion(driverVersion)
cdef cudaError_t _cudaRuntimeGetVersion(int* runtimeVersion) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaRuntimeGetVersion directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaRuntimeGetVersion(runtimeVersion)
    return ptds._cudaRuntimeGetVersion(runtimeVersion)
cdef cudaError_t _cudaGraphCreate(cudaGraph_t* pGraph, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphCreate directly unless cudaPythonInit() reports PTDS
    # mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphCreate(pGraph, flags)
    return ptds._cudaGraphCreate(pGraph, flags)
cdef cudaError_t _cudaGraphAddKernelNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaKernelNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphAddKernelNode directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphAddKernelNode(pGraphNode, graph, pDependencies, numDependencies, pNodeParams)
    return ptds._cudaGraphAddKernelNode(pGraphNode, graph, pDependencies, numDependencies, pNodeParams)
cdef cudaError_t _cudaGraphKernelNodeGetParams(cudaGraphNode_t node, cudaKernelNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphKernelNodeGetParams directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphKernelNodeGetParams(node, pNodeParams)
    return ptds._cudaGraphKernelNodeGetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphKernelNodeSetParams(cudaGraphNode_t node, const cudaKernelNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphKernelNodeSetParams directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphKernelNodeSetParams(node, pNodeParams)
    return ptds._cudaGraphKernelNodeSetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphKernelNodeCopyAttributes(cudaGraphNode_t hSrc, cudaGraphNode_t hDst) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphKernelNodeCopyAttributes directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphKernelNodeCopyAttributes(hSrc, hDst)
    return ptds._cudaGraphKernelNodeCopyAttributes(hSrc, hDst)
cdef cudaError_t _cudaGraphKernelNodeGetAttribute(cudaGraphNode_t hNode, cudaKernelNodeAttrID attr, cudaKernelNodeAttrValue* value_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphKernelNodeGetAttribute directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphKernelNodeGetAttribute(hNode, attr, value_out)
    return ptds._cudaGraphKernelNodeGetAttribute(hNode, attr, value_out)
cdef cudaError_t _cudaGraphKernelNodeSetAttribute(cudaGraphNode_t hNode, cudaKernelNodeAttrID attr, const cudaKernelNodeAttrValue* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphKernelNodeSetAttribute directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphKernelNodeSetAttribute(hNode, attr, value)
    return ptds._cudaGraphKernelNodeSetAttribute(hNode, attr, value)
cdef cudaError_t _cudaGraphAddMemcpyNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaMemcpy3DParms* pCopyParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphAddMemcpyNode directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphAddMemcpyNode(pGraphNode, graph, pDependencies, numDependencies, pCopyParams)
    return ptds._cudaGraphAddMemcpyNode(pGraphNode, graph, pDependencies, numDependencies, pCopyParams)
cdef cudaError_t _cudaGraphAddMemcpyNode1D(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, void* dst, const void* src, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphAddMemcpyNode1D directly unless cudaPythonInit() reports
    # PTDS mode, in which case the `ptds` module's variant handles the call.
    if not cudaPythonInit():
        return cudaGraphAddMemcpyNode1D(pGraphNode, graph, pDependencies, numDependencies, dst, src, count, kind)
    return ptds._cudaGraphAddMemcpyNode1D(pGraphNode, graph, pDependencies, numDependencies, dst, src, count, kind)
cdef cudaError_t _cudaGraphMemcpyNodeGetParams(cudaGraphNode_t node, cudaMemcpy3DParms* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphMemcpyNodeGetParams directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphMemcpyNodeGetParams(node, pNodeParams)
    return ptds._cudaGraphMemcpyNodeGetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphMemcpyNodeSetParams(cudaGraphNode_t node, const cudaMemcpy3DParms* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphMemcpyNodeSetParams directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphMemcpyNodeSetParams(node, pNodeParams)
    return ptds._cudaGraphMemcpyNodeSetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphMemcpyNodeSetParams1D(cudaGraphNode_t node, void* dst, const void* src, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # Call cudaGraphMemcpyNodeSetParams1D directly unless cudaPythonInit()
    # reports PTDS mode, in which case the `ptds` variant handles the call.
    if not cudaPythonInit():
        return cudaGraphMemcpyNodeSetParams1D(node, dst, src, count, kind)
    return ptds._cudaGraphMemcpyNodeSetParams1D(node, dst, src, count, kind)
cdef cudaError_t _cudaGraphAddMemsetNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaMemsetParams* pMemsetParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddMemsetNode when set, else call cudaGraphAddMemsetNode.
    if cudaPythonInit():
        return ptds._cudaGraphAddMemsetNode(pGraphNode, graph, pDependencies, numDependencies, pMemsetParams)
    return cudaGraphAddMemsetNode(pGraphNode, graph, pDependencies, numDependencies, pMemsetParams)
cdef cudaError_t _cudaGraphMemsetNodeGetParams(cudaGraphNode_t node, cudaMemsetParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphMemsetNodeGetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphMemsetNodeGetParams(node, pNodeParams)
    return cudaGraphMemsetNodeGetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphMemsetNodeSetParams(cudaGraphNode_t node, const cudaMemsetParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphMemsetNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphMemsetNodeSetParams(node, pNodeParams)
    return cudaGraphMemsetNodeSetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphAddHostNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaHostNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddHostNode when set, else call cudaGraphAddHostNode.
    if cudaPythonInit():
        return ptds._cudaGraphAddHostNode(pGraphNode, graph, pDependencies, numDependencies, pNodeParams)
    return cudaGraphAddHostNode(pGraphNode, graph, pDependencies, numDependencies, pNodeParams)
cdef cudaError_t _cudaGraphHostNodeGetParams(cudaGraphNode_t node, cudaHostNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphHostNodeGetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphHostNodeGetParams(node, pNodeParams)
    return cudaGraphHostNodeGetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphHostNodeSetParams(cudaGraphNode_t node, const cudaHostNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphHostNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphHostNodeSetParams(node, pNodeParams)
    return cudaGraphHostNodeSetParams(node, pNodeParams)
cdef cudaError_t _cudaGraphAddChildGraphNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, cudaGraph_t childGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddChildGraphNode when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddChildGraphNode(pGraphNode, graph, pDependencies, numDependencies, childGraph)
    return cudaGraphAddChildGraphNode(pGraphNode, graph, pDependencies, numDependencies, childGraph)
cdef cudaError_t _cudaGraphChildGraphNodeGetGraph(cudaGraphNode_t node, cudaGraph_t* pGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphChildGraphNodeGetGraph when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphChildGraphNodeGetGraph(node, pGraph)
    return cudaGraphChildGraphNodeGetGraph(node, pGraph)
cdef cudaError_t _cudaGraphAddEmptyNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddEmptyNode when set, else call cudaGraphAddEmptyNode.
    if cudaPythonInit():
        return ptds._cudaGraphAddEmptyNode(pGraphNode, graph, pDependencies, numDependencies)
    return cudaGraphAddEmptyNode(pGraphNode, graph, pDependencies, numDependencies)
cdef cudaError_t _cudaGraphAddEventRecordNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddEventRecordNode when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddEventRecordNode(pGraphNode, graph, pDependencies, numDependencies, event)
    return cudaGraphAddEventRecordNode(pGraphNode, graph, pDependencies, numDependencies, event)
cdef cudaError_t _cudaGraphEventRecordNodeGetEvent(cudaGraphNode_t node, cudaEvent_t* event_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphEventRecordNodeGetEvent when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphEventRecordNodeGetEvent(node, event_out)
    return cudaGraphEventRecordNodeGetEvent(node, event_out)
cdef cudaError_t _cudaGraphEventRecordNodeSetEvent(cudaGraphNode_t node, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphEventRecordNodeSetEvent when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphEventRecordNodeSetEvent(node, event)
    return cudaGraphEventRecordNodeSetEvent(node, event)
cdef cudaError_t _cudaGraphAddEventWaitNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddEventWaitNode when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddEventWaitNode(pGraphNode, graph, pDependencies, numDependencies, event)
    return cudaGraphAddEventWaitNode(pGraphNode, graph, pDependencies, numDependencies, event)
cdef cudaError_t _cudaGraphEventWaitNodeGetEvent(cudaGraphNode_t node, cudaEvent_t* event_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphEventWaitNodeGetEvent when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphEventWaitNodeGetEvent(node, event_out)
    return cudaGraphEventWaitNodeGetEvent(node, event_out)
cdef cudaError_t _cudaGraphEventWaitNodeSetEvent(cudaGraphNode_t node, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphEventWaitNodeSetEvent when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphEventWaitNodeSetEvent(node, event)
    return cudaGraphEventWaitNodeSetEvent(node, event)
cdef cudaError_t _cudaGraphAddExternalSemaphoresSignalNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaExternalSemaphoreSignalNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddExternalSemaphoresSignalNode when set, else call the
    # runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphAddExternalSemaphoresSignalNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
    return cudaGraphAddExternalSemaphoresSignalNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
cdef cudaError_t _cudaGraphExternalSemaphoresSignalNodeGetParams(cudaGraphNode_t hNode, cudaExternalSemaphoreSignalNodeParams* params_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExternalSemaphoresSignalNodeGetParams when set, else call
    # the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExternalSemaphoresSignalNodeGetParams(hNode, params_out)
    return cudaGraphExternalSemaphoresSignalNodeGetParams(hNode, params_out)
cdef cudaError_t _cudaGraphExternalSemaphoresSignalNodeSetParams(cudaGraphNode_t hNode, const cudaExternalSemaphoreSignalNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExternalSemaphoresSignalNodeSetParams when set, else call
    # the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExternalSemaphoresSignalNodeSetParams(hNode, nodeParams)
    return cudaGraphExternalSemaphoresSignalNodeSetParams(hNode, nodeParams)
cdef cudaError_t _cudaGraphAddExternalSemaphoresWaitNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, const cudaExternalSemaphoreWaitNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddExternalSemaphoresWaitNode when set, else call the
    # runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphAddExternalSemaphoresWaitNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
    return cudaGraphAddExternalSemaphoresWaitNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
cdef cudaError_t _cudaGraphExternalSemaphoresWaitNodeGetParams(cudaGraphNode_t hNode, cudaExternalSemaphoreWaitNodeParams* params_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExternalSemaphoresWaitNodeGetParams when set, else call
    # the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExternalSemaphoresWaitNodeGetParams(hNode, params_out)
    return cudaGraphExternalSemaphoresWaitNodeGetParams(hNode, params_out)
cdef cudaError_t _cudaGraphExternalSemaphoresWaitNodeSetParams(cudaGraphNode_t hNode, const cudaExternalSemaphoreWaitNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExternalSemaphoresWaitNodeSetParams when set, else call
    # the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExternalSemaphoresWaitNodeSetParams(hNode, nodeParams)
    return cudaGraphExternalSemaphoresWaitNodeSetParams(hNode, nodeParams)
cdef cudaError_t _cudaGraphAddMemAllocNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, cudaMemAllocNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddMemAllocNode when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddMemAllocNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
    return cudaGraphAddMemAllocNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
cdef cudaError_t _cudaGraphMemAllocNodeGetParams(cudaGraphNode_t node, cudaMemAllocNodeParams* params_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphMemAllocNodeGetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphMemAllocNodeGetParams(node, params_out)
    return cudaGraphMemAllocNodeGetParams(node, params_out)
cdef cudaError_t _cudaGraphAddMemFreeNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, void* dptr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddMemFreeNode when set, else call cudaGraphAddMemFreeNode.
    if cudaPythonInit():
        return ptds._cudaGraphAddMemFreeNode(pGraphNode, graph, pDependencies, numDependencies, dptr)
    return cudaGraphAddMemFreeNode(pGraphNode, graph, pDependencies, numDependencies, dptr)
cdef cudaError_t _cudaGraphMemFreeNodeGetParams(cudaGraphNode_t node, void* dptr_out) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphMemFreeNodeGetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphMemFreeNodeGetParams(node, dptr_out)
    return cudaGraphMemFreeNodeGetParams(node, dptr_out)
cdef cudaError_t _cudaDeviceGraphMemTrim(int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaDeviceGraphMemTrim when set, else call cudaDeviceGraphMemTrim.
    if cudaPythonInit():
        return ptds._cudaDeviceGraphMemTrim(device)
    return cudaDeviceGraphMemTrim(device)
cdef cudaError_t _cudaDeviceGetGraphMemAttribute(int device, cudaGraphMemAttributeType attr, void* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaDeviceGetGraphMemAttribute when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaDeviceGetGraphMemAttribute(device, attr, value)
    return cudaDeviceGetGraphMemAttribute(device, attr, value)
cdef cudaError_t _cudaDeviceSetGraphMemAttribute(int device, cudaGraphMemAttributeType attr, void* value) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaDeviceSetGraphMemAttribute when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaDeviceSetGraphMemAttribute(device, attr, value)
    return cudaDeviceSetGraphMemAttribute(device, attr, value)
cdef cudaError_t _cudaGraphClone(cudaGraph_t* pGraphClone, cudaGraph_t originalGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphClone when set, else call cudaGraphClone directly.
    if cudaPythonInit():
        return ptds._cudaGraphClone(pGraphClone, originalGraph)
    return cudaGraphClone(pGraphClone, originalGraph)
cdef cudaError_t _cudaGraphNodeFindInClone(cudaGraphNode_t* pNode, cudaGraphNode_t originalNode, cudaGraph_t clonedGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeFindInClone when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphNodeFindInClone(pNode, originalNode, clonedGraph)
    return cudaGraphNodeFindInClone(pNode, originalNode, clonedGraph)
cdef cudaError_t _cudaGraphNodeGetType(cudaGraphNode_t node, cudaGraphNodeType* pType) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetType when set, else call cudaGraphNodeGetType.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetType(node, pType)
    return cudaGraphNodeGetType(node, pType)
cdef cudaError_t _cudaGraphGetNodes(cudaGraph_t graph, cudaGraphNode_t* nodes, size_t* numNodes) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphGetNodes when set, else call cudaGraphGetNodes directly.
    if cudaPythonInit():
        return ptds._cudaGraphGetNodes(graph, nodes, numNodes)
    return cudaGraphGetNodes(graph, nodes, numNodes)
cdef cudaError_t _cudaGraphGetRootNodes(cudaGraph_t graph, cudaGraphNode_t* pRootNodes, size_t* pNumRootNodes) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphGetRootNodes when set, else call cudaGraphGetRootNodes.
    if cudaPythonInit():
        return ptds._cudaGraphGetRootNodes(graph, pRootNodes, pNumRootNodes)
    return cudaGraphGetRootNodes(graph, pRootNodes, pNumRootNodes)
cdef cudaError_t _cudaGraphGetEdges(cudaGraph_t graph, cudaGraphNode_t* from_, cudaGraphNode_t* to, size_t* numEdges) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphGetEdges when set, else call cudaGraphGetEdges directly.
    if cudaPythonInit():
        return ptds._cudaGraphGetEdges(graph, from_, to, numEdges)
    return cudaGraphGetEdges(graph, from_, to, numEdges)
cdef cudaError_t _cudaGraphGetEdges_v2(cudaGraph_t graph, cudaGraphNode_t* from_, cudaGraphNode_t* to, cudaGraphEdgeData* edgeData, size_t* numEdges) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphGetEdges_v2 when set, else call cudaGraphGetEdges_v2.
    if cudaPythonInit():
        return ptds._cudaGraphGetEdges_v2(graph, from_, to, edgeData, numEdges)
    return cudaGraphGetEdges_v2(graph, from_, to, edgeData, numEdges)
cdef cudaError_t _cudaGraphNodeGetDependencies(cudaGraphNode_t node, cudaGraphNode_t* pDependencies, size_t* pNumDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetDependencies when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetDependencies(node, pDependencies, pNumDependencies)
    return cudaGraphNodeGetDependencies(node, pDependencies, pNumDependencies)
cdef cudaError_t _cudaGraphNodeGetDependencies_v2(cudaGraphNode_t node, cudaGraphNode_t* pDependencies, cudaGraphEdgeData* edgeData, size_t* pNumDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetDependencies_v2 when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetDependencies_v2(node, pDependencies, edgeData, pNumDependencies)
    return cudaGraphNodeGetDependencies_v2(node, pDependencies, edgeData, pNumDependencies)
cdef cudaError_t _cudaGraphNodeGetDependentNodes(cudaGraphNode_t node, cudaGraphNode_t* pDependentNodes, size_t* pNumDependentNodes) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetDependentNodes when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetDependentNodes(node, pDependentNodes, pNumDependentNodes)
    return cudaGraphNodeGetDependentNodes(node, pDependentNodes, pNumDependentNodes)
cdef cudaError_t _cudaGraphNodeGetDependentNodes_v2(cudaGraphNode_t node, cudaGraphNode_t* pDependentNodes, cudaGraphEdgeData* edgeData, size_t* pNumDependentNodes) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetDependentNodes_v2 when set, else call the runtime
    # symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetDependentNodes_v2(node, pDependentNodes, edgeData, pNumDependentNodes)
    return cudaGraphNodeGetDependentNodes_v2(node, pDependentNodes, edgeData, pNumDependentNodes)
cdef cudaError_t _cudaGraphAddDependencies(cudaGraph_t graph, const cudaGraphNode_t* from_, const cudaGraphNode_t* to, size_t numDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddDependencies when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddDependencies(graph, from_, to, numDependencies)
    return cudaGraphAddDependencies(graph, from_, to, numDependencies)
cdef cudaError_t _cudaGraphAddDependencies_v2(cudaGraph_t graph, const cudaGraphNode_t* from_, const cudaGraphNode_t* to, const cudaGraphEdgeData* edgeData, size_t numDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddDependencies_v2 when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphAddDependencies_v2(graph, from_, to, edgeData, numDependencies)
    return cudaGraphAddDependencies_v2(graph, from_, to, edgeData, numDependencies)
cdef cudaError_t _cudaGraphRemoveDependencies(cudaGraph_t graph, const cudaGraphNode_t* from_, const cudaGraphNode_t* to, size_t numDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphRemoveDependencies when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphRemoveDependencies(graph, from_, to, numDependencies)
    return cudaGraphRemoveDependencies(graph, from_, to, numDependencies)
cdef cudaError_t _cudaGraphRemoveDependencies_v2(cudaGraph_t graph, const cudaGraphNode_t* from_, const cudaGraphNode_t* to, const cudaGraphEdgeData* edgeData, size_t numDependencies) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphRemoveDependencies_v2 when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphRemoveDependencies_v2(graph, from_, to, edgeData, numDependencies)
    return cudaGraphRemoveDependencies_v2(graph, from_, to, edgeData, numDependencies)
cdef cudaError_t _cudaGraphDestroyNode(cudaGraphNode_t node) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphDestroyNode when set, else call cudaGraphDestroyNode.
    if cudaPythonInit():
        return ptds._cudaGraphDestroyNode(node)
    return cudaGraphDestroyNode(node)
cdef cudaError_t _cudaGraphInstantiate(cudaGraphExec_t* pGraphExec, cudaGraph_t graph, unsigned long long flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphInstantiate when set, else call cudaGraphInstantiate.
    if cudaPythonInit():
        return ptds._cudaGraphInstantiate(pGraphExec, graph, flags)
    return cudaGraphInstantiate(pGraphExec, graph, flags)
cdef cudaError_t _cudaGraphInstantiateWithFlags(cudaGraphExec_t* pGraphExec, cudaGraph_t graph, unsigned long long flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphInstantiateWithFlags when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphInstantiateWithFlags(pGraphExec, graph, flags)
    return cudaGraphInstantiateWithFlags(pGraphExec, graph, flags)
cdef cudaError_t _cudaGraphInstantiateWithParams(cudaGraphExec_t* pGraphExec, cudaGraph_t graph, cudaGraphInstantiateParams* instantiateParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphInstantiateWithParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphInstantiateWithParams(pGraphExec, graph, instantiateParams)
    return cudaGraphInstantiateWithParams(pGraphExec, graph, instantiateParams)
cdef cudaError_t _cudaGraphExecGetFlags(cudaGraphExec_t graphExec, unsigned long long* flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecGetFlags when set, else call cudaGraphExecGetFlags.
    if cudaPythonInit():
        return ptds._cudaGraphExecGetFlags(graphExec, flags)
    return cudaGraphExecGetFlags(graphExec, flags)
cdef cudaError_t _cudaGraphExecKernelNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const cudaKernelNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecKernelNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphExecKernelNodeSetParams(hGraphExec, node, pNodeParams)
    return cudaGraphExecKernelNodeSetParams(hGraphExec, node, pNodeParams)
cdef cudaError_t _cudaGraphExecMemcpyNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const cudaMemcpy3DParms* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecMemcpyNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphExecMemcpyNodeSetParams(hGraphExec, node, pNodeParams)
    return cudaGraphExecMemcpyNodeSetParams(hGraphExec, node, pNodeParams)
cdef cudaError_t _cudaGraphExecMemcpyNodeSetParams1D(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, void* dst, const void* src, size_t count, cudaMemcpyKind kind) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecMemcpyNodeSetParams1D when set, else call the runtime
    # symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecMemcpyNodeSetParams1D(hGraphExec, node, dst, src, count, kind)
    return cudaGraphExecMemcpyNodeSetParams1D(hGraphExec, node, dst, src, count, kind)
cdef cudaError_t _cudaGraphExecMemsetNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const cudaMemsetParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecMemsetNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphExecMemsetNodeSetParams(hGraphExec, node, pNodeParams)
    return cudaGraphExecMemsetNodeSetParams(hGraphExec, node, pNodeParams)
cdef cudaError_t _cudaGraphExecHostNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const cudaHostNodeParams* pNodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecHostNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphExecHostNodeSetParams(hGraphExec, node, pNodeParams)
    return cudaGraphExecHostNodeSetParams(hGraphExec, node, pNodeParams)
cdef cudaError_t _cudaGraphExecChildGraphNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, cudaGraph_t childGraph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecChildGraphNodeSetParams when set, else call the runtime
    # symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecChildGraphNodeSetParams(hGraphExec, node, childGraph)
    return cudaGraphExecChildGraphNodeSetParams(hGraphExec, node, childGraph)
cdef cudaError_t _cudaGraphExecEventRecordNodeSetEvent(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecEventRecordNodeSetEvent when set, else call the runtime
    # symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecEventRecordNodeSetEvent(hGraphExec, hNode, event)
    return cudaGraphExecEventRecordNodeSetEvent(hGraphExec, hNode, event)
cdef cudaError_t _cudaGraphExecEventWaitNodeSetEvent(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, cudaEvent_t event) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecEventWaitNodeSetEvent when set, else call the runtime
    # symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecEventWaitNodeSetEvent(hGraphExec, hNode, event)
    return cudaGraphExecEventWaitNodeSetEvent(hGraphExec, hNode, event)
cdef cudaError_t _cudaGraphExecExternalSemaphoresSignalNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, const cudaExternalSemaphoreSignalNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecExternalSemaphoresSignalNodeSetParams when set, else
    # call the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecExternalSemaphoresSignalNodeSetParams(hGraphExec, hNode, nodeParams)
    return cudaGraphExecExternalSemaphoresSignalNodeSetParams(hGraphExec, hNode, nodeParams)
cdef cudaError_t _cudaGraphExecExternalSemaphoresWaitNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, const cudaExternalSemaphoreWaitNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecExternalSemaphoresWaitNodeSetParams when set, else
    # call the runtime symbol directly.
    if cudaPythonInit():
        return ptds._cudaGraphExecExternalSemaphoresWaitNodeSetParams(hGraphExec, hNode, nodeParams)
    return cudaGraphExecExternalSemaphoresWaitNodeSetParams(hGraphExec, hNode, nodeParams)
cdef cudaError_t _cudaGraphNodeSetEnabled(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, unsigned int isEnabled) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeSetEnabled when set, else call cudaGraphNodeSetEnabled.
    if cudaPythonInit():
        return ptds._cudaGraphNodeSetEnabled(hGraphExec, hNode, isEnabled)
    return cudaGraphNodeSetEnabled(hGraphExec, hNode, isEnabled)
cdef cudaError_t _cudaGraphNodeGetEnabled(cudaGraphExec_t hGraphExec, cudaGraphNode_t hNode, unsigned int* isEnabled) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeGetEnabled when set, else call cudaGraphNodeGetEnabled.
    if cudaPythonInit():
        return ptds._cudaGraphNodeGetEnabled(hGraphExec, hNode, isEnabled)
    return cudaGraphNodeGetEnabled(hGraphExec, hNode, isEnabled)
cdef cudaError_t _cudaGraphExecUpdate(cudaGraphExec_t hGraphExec, cudaGraph_t hGraph, cudaGraphExecUpdateResultInfo* resultInfo) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecUpdate when set, else call cudaGraphExecUpdate.
    if cudaPythonInit():
        return ptds._cudaGraphExecUpdate(hGraphExec, hGraph, resultInfo)
    return cudaGraphExecUpdate(hGraphExec, hGraph, resultInfo)
cdef cudaError_t _cudaGraphUpload(cudaGraphExec_t graphExec, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphUpload when set, else call cudaGraphUpload directly.
    if cudaPythonInit():
        return ptds._cudaGraphUpload(graphExec, stream)
    return cudaGraphUpload(graphExec, stream)
cdef cudaError_t _cudaGraphLaunch(cudaGraphExec_t graphExec, cudaStream_t stream) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphLaunch when set, else call cudaGraphLaunch directly.
    if cudaPythonInit():
        return ptds._cudaGraphLaunch(graphExec, stream)
    return cudaGraphLaunch(graphExec, stream)
cdef cudaError_t _cudaGraphExecDestroy(cudaGraphExec_t graphExec) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecDestroy when set, else call cudaGraphExecDestroy.
    if cudaPythonInit():
        return ptds._cudaGraphExecDestroy(graphExec)
    return cudaGraphExecDestroy(graphExec)
cdef cudaError_t _cudaGraphDestroy(cudaGraph_t graph) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphDestroy when set, else call cudaGraphDestroy directly.
    if cudaPythonInit():
        return ptds._cudaGraphDestroy(graph)
    return cudaGraphDestroy(graph)
cdef cudaError_t _cudaGraphDebugDotPrint(cudaGraph_t graph, const char* path, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphDebugDotPrint when set, else call cudaGraphDebugDotPrint.
    if cudaPythonInit():
        return ptds._cudaGraphDebugDotPrint(graph, path, flags)
    return cudaGraphDebugDotPrint(graph, path, flags)
cdef cudaError_t _cudaUserObjectCreate(cudaUserObject_t* object_out, void* ptr, cudaHostFn_t destroy, unsigned int initialRefcount, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaUserObjectCreate when set, else call cudaUserObjectCreate.
    if cudaPythonInit():
        return ptds._cudaUserObjectCreate(object_out, ptr, destroy, initialRefcount, flags)
    return cudaUserObjectCreate(object_out, ptr, destroy, initialRefcount, flags)
cdef cudaError_t _cudaUserObjectRetain(cudaUserObject_t object, unsigned int count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaUserObjectRetain when set, else call cudaUserObjectRetain.
    if cudaPythonInit():
        return ptds._cudaUserObjectRetain(object, count)
    return cudaUserObjectRetain(object, count)
cdef cudaError_t _cudaUserObjectRelease(cudaUserObject_t object, unsigned int count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaUserObjectRelease when set, else call cudaUserObjectRelease.
    if cudaPythonInit():
        return ptds._cudaUserObjectRelease(object, count)
    return cudaUserObjectRelease(object, count)
cdef cudaError_t _cudaGraphRetainUserObject(cudaGraph_t graph, cudaUserObject_t object, unsigned int count, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphRetainUserObject when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphRetainUserObject(graph, object, count, flags)
    return cudaGraphRetainUserObject(graph, object, count, flags)
cdef cudaError_t _cudaGraphReleaseUserObject(cudaGraph_t graph, cudaUserObject_t object, unsigned int count) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphReleaseUserObject when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphReleaseUserObject(graph, object, count)
    return cudaGraphReleaseUserObject(graph, object, count)
cdef cudaError_t _cudaGraphAddNode(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, size_t numDependencies, cudaGraphNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddNode when set, else call cudaGraphAddNode directly.
    if cudaPythonInit():
        return ptds._cudaGraphAddNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
    return cudaGraphAddNode(pGraphNode, graph, pDependencies, numDependencies, nodeParams)
cdef cudaError_t _cudaGraphAddNode_v2(cudaGraphNode_t* pGraphNode, cudaGraph_t graph, const cudaGraphNode_t* pDependencies, const cudaGraphEdgeData* dependencyData, size_t numDependencies, cudaGraphNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphAddNode_v2 when set, else call cudaGraphAddNode_v2.
    if cudaPythonInit():
        return ptds._cudaGraphAddNode_v2(pGraphNode, graph, pDependencies, dependencyData, numDependencies, nodeParams)
    return cudaGraphAddNode_v2(pGraphNode, graph, pDependencies, dependencyData, numDependencies, nodeParams)
cdef cudaError_t _cudaGraphNodeSetParams(cudaGraphNode_t node, cudaGraphNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphNodeSetParams when set, else call cudaGraphNodeSetParams.
    if cudaPythonInit():
        return ptds._cudaGraphNodeSetParams(node, nodeParams)
    return cudaGraphNodeSetParams(node, nodeParams)
cdef cudaError_t _cudaGraphExecNodeSetParams(cudaGraphExec_t graphExec, cudaGraphNode_t node, cudaGraphNodeParams* nodeParams) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphExecNodeSetParams when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphExecNodeSetParams(graphExec, node, nodeParams)
    return cudaGraphExecNodeSetParams(graphExec, node, nodeParams)
cdef cudaError_t _cudaGraphConditionalHandleCreate(cudaGraphConditionalHandle* pHandle_out, cudaGraph_t graph, unsigned int defaultLaunchValue, unsigned int flags) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGraphConditionalHandleCreate when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGraphConditionalHandleCreate(pHandle_out, graph, defaultLaunchValue, flags)
    return cudaGraphConditionalHandleCreate(pHandle_out, graph, defaultLaunchValue, flags)
cdef cudaError_t _cudaGetDriverEntryPoint(const char* symbol, void** funcPtr, unsigned long long flags, cudaDriverEntryPointQueryResult* driverStatus) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGetDriverEntryPoint when set, else call cudaGetDriverEntryPoint.
    if cudaPythonInit():
        return ptds._cudaGetDriverEntryPoint(symbol, funcPtr, flags, driverStatus)
    return cudaGetDriverEntryPoint(symbol, funcPtr, flags, driverStatus)
cdef cudaError_t _cudaGetDriverEntryPointByVersion(const char* symbol, void** funcPtr, unsigned int cudaVersion, unsigned long long flags, cudaDriverEntryPointQueryResult* driverStatus) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGetDriverEntryPointByVersion when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaGetDriverEntryPointByVersion(symbol, funcPtr, cudaVersion, flags, driverStatus)
    return cudaGetDriverEntryPointByVersion(symbol, funcPtr, cudaVersion, flags, driverStatus)
cdef cudaError_t _cudaLibraryLoadData(cudaLibrary_t* library, const void* code, cudaJitOption* jitOptions, void** jitOptionsValues, unsigned int numJitOptions, cudaLibraryOption* libraryOptions, void** libraryOptionValues, unsigned int numLibraryOptions) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryLoadData when set, else call cudaLibraryLoadData.
    if cudaPythonInit():
        return ptds._cudaLibraryLoadData(library, code, jitOptions, jitOptionsValues, numJitOptions, libraryOptions, libraryOptionValues, numLibraryOptions)
    return cudaLibraryLoadData(library, code, jitOptions, jitOptionsValues, numJitOptions, libraryOptions, libraryOptionValues, numLibraryOptions)
cdef cudaError_t _cudaLibraryLoadFromFile(cudaLibrary_t* library, const char* fileName, cudaJitOption* jitOptions, void** jitOptionsValues, unsigned int numJitOptions, cudaLibraryOption* libraryOptions, void** libraryOptionValues, unsigned int numLibraryOptions) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryLoadFromFile when set, else call cudaLibraryLoadFromFile.
    if cudaPythonInit():
        return ptds._cudaLibraryLoadFromFile(library, fileName, jitOptions, jitOptionsValues, numJitOptions, libraryOptions, libraryOptionValues, numLibraryOptions)
    return cudaLibraryLoadFromFile(library, fileName, jitOptions, jitOptionsValues, numJitOptions, libraryOptions, libraryOptionValues, numLibraryOptions)
cdef cudaError_t _cudaLibraryUnload(cudaLibrary_t library) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryUnload when set, else call cudaLibraryUnload directly.
    if cudaPythonInit():
        return ptds._cudaLibraryUnload(library)
    return cudaLibraryUnload(library)
cdef cudaError_t _cudaLibraryGetKernel(cudaKernel_t* pKernel, cudaLibrary_t library, const char* name) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryGetKernel when set, else call cudaLibraryGetKernel.
    if cudaPythonInit():
        return ptds._cudaLibraryGetKernel(pKernel, library, name)
    return cudaLibraryGetKernel(pKernel, library, name)
cdef cudaError_t _cudaLibraryGetGlobal(void** dptr, size_t* numbytes, cudaLibrary_t library, const char* name) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryGetGlobal when set, else call cudaLibraryGetGlobal.
    if cudaPythonInit():
        return ptds._cudaLibraryGetGlobal(dptr, numbytes, library, name)
    return cudaLibraryGetGlobal(dptr, numbytes, library, name)
cdef cudaError_t _cudaLibraryGetManaged(void** dptr, size_t* numbytes, cudaLibrary_t library, const char* name) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryGetManaged when set, else call cudaLibraryGetManaged.
    if cudaPythonInit():
        return ptds._cudaLibraryGetManaged(dptr, numbytes, library, name)
    return cudaLibraryGetManaged(dptr, numbytes, library, name)
cdef cudaError_t _cudaLibraryGetUnifiedFunction(void** fptr, cudaLibrary_t library, const char* symbol) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryGetUnifiedFunction when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaLibraryGetUnifiedFunction(fptr, library, symbol)
    return cudaLibraryGetUnifiedFunction(fptr, library, symbol)
cdef cudaError_t _cudaLibraryGetKernelCount(unsigned int* count, cudaLibrary_t lib) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryGetKernelCount when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaLibraryGetKernelCount(count, lib)
    return cudaLibraryGetKernelCount(count, lib)
cdef cudaError_t _cudaLibraryEnumerateKernels(cudaKernel_t* kernels, unsigned int numKernels, cudaLibrary_t lib) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaLibraryEnumerateKernels when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaLibraryEnumerateKernels(kernels, numKernels, lib)
    return cudaLibraryEnumerateKernels(kernels, numKernels, lib)
cdef cudaError_t _cudaKernelSetAttributeForDevice(cudaKernel_t kernel, cudaFuncAttribute attr, int value, int device) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaKernelSetAttributeForDevice when set, else call the runtime symbol.
    if cudaPythonInit():
        return ptds._cudaKernelSetAttributeForDevice(kernel, attr, value, device)
    return cudaKernelSetAttributeForDevice(kernel, attr, value, device)
cdef cudaError_t _cudaGetExportTable(const void** ppExportTable, const cudaUUID_t* pExportTableId) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGetExportTable when set, else call cudaGetExportTable directly.
    if cudaPythonInit():
        return ptds._cudaGetExportTable(ppExportTable, pExportTableId)
    return cudaGetExportTable(ppExportTable, pExportTableId)
cdef cudaError_t _cudaGetKernel(cudaKernel_t* kernelPtr, const void* entryFuncAddr) except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaGetKernel when set, else call cudaGetKernel directly.
    if cudaPythonInit():
        return ptds._cudaGetKernel(kernelPtr, entryFuncAddr)
    return cudaGetKernel(kernelPtr, entryFuncAddr)
@cython.show_performance_hints(False)
cdef cudaPitchedPtr _make_cudaPitchedPtr(void* d, size_t p, size_t xsz, size_t ysz) except* nogil:
    # PTDS dispatch for the struct-returning helper: cudaPythonInit() yields the
    # cached PTDS flag; forward to ptds._make_cudaPitchedPtr when set, else
    # call make_cudaPitchedPtr directly.
    if cudaPythonInit():
        return ptds._make_cudaPitchedPtr(d, p, xsz, ysz)
    return make_cudaPitchedPtr(d, p, xsz, ysz)
@cython.show_performance_hints(False)
cdef cudaPos _make_cudaPos(size_t x, size_t y, size_t z) except* nogil:
    # PTDS dispatch for the struct-returning helper: cudaPythonInit() yields the
    # cached PTDS flag; forward to ptds._make_cudaPos when set, else call
    # make_cudaPos directly.
    if cudaPythonInit():
        return ptds._make_cudaPos(x, y, z)
    return make_cudaPos(x, y, z)
@cython.show_performance_hints(False)
cdef cudaExtent _make_cudaExtent(size_t w, size_t h, size_t d) except* nogil:
    # PTDS dispatch for the struct-returning helper: cudaPythonInit() yields the
    # cached PTDS flag; forward to ptds._make_cudaExtent when set, else call
    # make_cudaExtent directly.
    if cudaPythonInit():
        return ptds._make_cudaExtent(w, h, d)
    return make_cudaExtent(w, h, d)
cdef cudaError_t _cudaProfilerStart() except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaProfilerStart when set, else call cudaProfilerStart directly.
    if cudaPythonInit():
        return ptds._cudaProfilerStart()
    return cudaProfilerStart()
cdef cudaError_t _cudaProfilerStop() except ?cudaErrorCallRequiresNewerDriver nogil:
    # PTDS dispatch: cudaPythonInit() yields the cached PTDS flag; forward to
    # ptds._cudaProfilerStop when set, else call cudaProfilerStop directly.
    if cudaPythonInit():
        return ptds._cudaProfilerStop()
    return cudaProfilerStop()
include "../_lib/cyruntime/cyruntime.pxi"