#pragma once #include #include #include namespace spconv { void cutlass_mm_out(torch::Tensor c, torch::Tensor a, torch::Tensor b); void cutlass_mm_out(cudaStream_t stream, torch::Tensor c, torch::Tensor a, torch::Tensor b); } // namespace spconv