#ifndef CUDA_STREAM_MANAGER_H #define CUDA_STREAM_MANAGER_H #include #include #include #define MAX_STREAMS 16 struct CudaStreamManager { const size_t num_expert; cublasHandle_t* handles; cudaStream_t* streams; CudaStreamManager(const size_t num_expert_) : num_expert(num_expert_) { streams = new cudaStream_t[MAX_STREAMS]; handles = new cublasHandle_t[MAX_STREAMS]; for (size_t i=0; i