#include #include "profile_gemm_reduce_impl.hpp" int main() { using Row = ck::tensor_layout::gemm::RowMajor; using Col = ck::tensor_layout::gemm::ColumnMajor; int M = 512; int N = 256; int K = 128; bool pass = true; pass = pass && ck::profiler:: profile_gemm_reduce_impl( true, 1, false, 1, M, N, K, K, N, N); pass = pass && ck::profiler:: profile_gemm_reduce_impl( true, 1, false, 1, M, N, K, K, K, N); pass = pass && ck::profiler:: profile_gemm_reduce_impl( true, 1, false, 1, M, N, K, M, N, N); pass = pass && ck::profiler:: profile_gemm_reduce_impl( true, 1, false, 1, M, N, K, M, K, N); if(pass) { std::cout << "test GEMM+Reduce fp16: Pass" << std::endl; return 0; } else { std::cout << "test GEMM+Reduce fp16: Fail" << std::endl; return -1; } }