#include "../../utils.h" #include "infinirt_cuda.cuh" #include #define CHECK_CUDART(RT_API) CHECK_INTERNAL(RT_API, cudaSuccess) namespace infinirt::cuda { infiniStatus_t getDeviceCount(int *count) { CHECK_CUDART(cudaGetDeviceCount(count)); return INFINI_STATUS_SUCCESS; } infiniStatus_t setDevice(int device_id) { CHECK_CUDART(cudaSetDevice(device_id)); return INFINI_STATUS_SUCCESS; } infiniStatus_t deviceSynchronize() { CHECK_CUDART(cudaDeviceSynchronize()); return INFINI_STATUS_SUCCESS; } infiniStatus_t streamCreate(infinirtStream_t *stream_ptr) { cudaStream_t stream; CHECK_CUDART(cudaStreamCreate(&stream)); *stream_ptr = stream; return INFINI_STATUS_SUCCESS; } infiniStatus_t streamDestroy(infinirtStream_t stream) { CHECK_CUDART(cudaStreamDestroy((cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } infiniStatus_t streamSynchronize(infinirtStream_t stream) { CHECK_CUDART(cudaStreamSynchronize((cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } infiniStatus_t streamWaitEvent(infinirtStream_t stream, infinirtEvent_t event) { #ifdef ENABLE_ILUVATAR_API return INFINI_STATUS_NOT_IMPLEMENTED; #else CHECK_CUDART(cudaStreamWaitEvent((cudaStream_t)stream, (cudaEvent_t)event)); return INFINI_STATUS_SUCCESS; #endif } infiniStatus_t eventCreate(infinirtEvent_t *event_ptr) { cudaEvent_t event; CHECK_CUDART(cudaEventCreate(&event)); *event_ptr = event; return INFINI_STATUS_SUCCESS; } infiniStatus_t eventRecord(infinirtEvent_t event, infinirtStream_t stream) { CHECK_CUDART(cudaEventRecord((cudaEvent_t)event, (cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } infiniStatus_t eventQuery(infinirtEvent_t event, infinirtEventStatus_t *status_ptr) { auto status = cudaEventQuery((cudaEvent_t)event); if (status == cudaSuccess) { *status_ptr = INFINIRT_EVENT_COMPLETE; } else if (status == cudaErrorNotReady) { *status_ptr = INFINIRT_EVENT_NOT_READY; } else { CHECK_CUDART(status); } return INFINI_STATUS_SUCCESS; } infiniStatus_t eventSynchronize(infinirtEvent_t event) { CHECK_CUDART(cudaEventSynchronize((cudaEvent_t)event)); return INFINI_STATUS_SUCCESS; } infiniStatus_t eventDestroy(infinirtEvent_t event) { CHECK_CUDART(cudaEventDestroy((cudaEvent_t)event)); return INFINI_STATUS_SUCCESS; } infiniStatus_t mallocDevice(void **p_ptr, size_t size) { CHECK_CUDART(cudaMalloc(p_ptr, size)); return INFINI_STATUS_SUCCESS; } infiniStatus_t mallocHost(void **p_ptr, size_t size) { CHECK_CUDART(cudaMallocHost(p_ptr, size)); return INFINI_STATUS_SUCCESS; } infiniStatus_t freeDevice(void *ptr) { CHECK_CUDART(cudaFree(ptr)); return INFINI_STATUS_SUCCESS; } infiniStatus_t freeHost(void *ptr) { CHECK_CUDART(cudaFreeHost(ptr)); return INFINI_STATUS_SUCCESS; } cudaMemcpyKind toCudaMemcpyKind(infinirtMemcpyKind_t kind) { switch (kind) { case INFINIRT_MEMCPY_H2D: return cudaMemcpyHostToDevice; case INFINIRT_MEMCPY_D2H: return cudaMemcpyDeviceToHost; case INFINIRT_MEMCPY_D2D: return cudaMemcpyDeviceToDevice; case INFINIRT_MEMCPY_H2H: return cudaMemcpyHostToHost; default: return cudaMemcpyDefault; } } infiniStatus_t memcpy(void *dst, const void *src, size_t size, infinirtMemcpyKind_t kind) { CHECK_CUDART(cudaMemcpy(dst, src, size, toCudaMemcpyKind(kind))); return INFINI_STATUS_SUCCESS; } infiniStatus_t memcpyAsync(void *dst, const void *src, size_t size, infinirtMemcpyKind_t kind, infinirtStream_t stream) { CHECK_CUDART(cudaMemcpyAsync(dst, src, size, toCudaMemcpyKind(kind), (cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } infiniStatus_t mallocAsync(void **p_ptr, size_t size, infinirtStream_t stream) { CHECK_CUDART(cudaMallocAsync(p_ptr, size, (cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } infiniStatus_t freeAsync(void *ptr, infinirtStream_t stream) { CHECK_CUDART(cudaFreeAsync(ptr, (cudaStream_t)stream)); return INFINI_STATUS_SUCCESS; } } // namespace infinirt::cuda