"git@developer.sourcefind.cn:yangql/composable_kernel-1.git" did not exist on "5245a0162bbbe5f49be9cc8f2189f53465f691ec"
Unverified commit 9061d39b, authored by Illia Silin and committed by GitHub
Browse files

Fix the slow CPU reference batched GEMM kernels. (#388)

* fix the performance of the batched gemm verification

* fix tabs
parent 1e5b59df
...@@ -83,8 +83,8 @@ struct ReferenceBatchedGemm : public device::BaseOperator ...@@ -83,8 +83,8 @@ struct ReferenceBatchedGemm : public device::BaseOperator
make_ParallelTensorFunctor(f_gmk_gkn_gmn, make_ParallelTensorFunctor(f_gmk_gkn_gmn,
arg.c_g_m_n_.mDesc.GetLengths()[0], arg.c_g_m_n_.mDesc.GetLengths()[0],
arg.c_g_m_n_.mDesc.GetLengths()[1], arg.c_g_m_n_.mDesc.GetLengths()[1],
arg.c_g_m_n_.mDesc.GetLengths()[2])(); arg.c_g_m_n_.mDesc.GetLengths()[2])(
std::thread::hardware_concurrency());
return 0; return 0;
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment