Commit 4dd82801 authored by Adam Osewski
Browse files

Small refinements.

parent fe96e8fb
...@@ -744,7 +744,7 @@ struct DeviceGroupedGemmMultipleD_Dl : public DeviceGroupedGemm<ALayout, ...@@ -744,7 +744,7 @@ struct DeviceGroupedGemmMultipleD_Dl : public DeviceGroupedGemm<ALayout,
<< K1 << ", " << K1 << ", "
<< M1PerThread << ", " << M1PerThread << ", "
<< N1PerThread << ", " << N1PerThread << ", "
<< KPerThread << KPerThread << ", "
<< getGemmSpecializationString(GemmSpec) << getGemmSpecializationString(GemmSpec)
<< ">"; << ">";
// clang-format on // clang-format on
......
...@@ -315,7 +315,7 @@ struct GridwiseGemmDlMultipleD_km_kn_mn ...@@ -315,7 +315,7 @@ struct GridwiseGemmDlMultipleD_km_kn_mn
static_assert(a_block_desc_k0_m0_m1_k1.GetElementSpaceSize() == static_assert(a_block_desc_k0_m0_m1_k1.GetElementSpaceSize() ==
a_k0_m_k1_block_desc.GetElementSpaceSize() && a_k0_m_k1_block_desc.GetElementSpaceSize() &&
b_block_desc_k0_n0_n1_k1.GetElementSpaceSize() == b_block_desc_k0_n0_n1_k1.GetElementSpaceSize() ==
b_k0_n_k1_block_desc.GetElementSpaceSize() && b_k0_n_k1_block_desc.GetElementSpaceSize(),
"wrong!"); "wrong!");
// A matrix blockwise copy // A matrix blockwise copy
......
...@@ -253,7 +253,12 @@ bool profile_grouped_gemm_impl(int do_verification, ...@@ -253,7 +253,12 @@ bool profile_grouped_gemm_impl(int do_verification,
c_element_op); c_element_op);
ref_invoker.Run(ref_argument); ref_invoker.Run(ref_argument);
pass = pass && ck::utils::check_err(c_m_n_device_results[i], c_m_n_host_result); bool group_pass =
ck::utils::check_err(c_m_n_device_results[i], c_m_n_host_result);
pass = pass && group_pass;
std::cout << "group: " << i << " verification result: " << std::boolalpha
<< group_pass << std::endl;
if(do_log) if(do_log)
{ {
...@@ -276,6 +281,11 @@ bool profile_grouped_gemm_impl(int do_verification, ...@@ -276,6 +281,11 @@ bool profile_grouped_gemm_impl(int do_verification,
} }
} }
if(do_verification)
{
std::cout << "Verification: " << (pass ? "SUCCESS" : "FAILURE") << std::endl;
}
std::cout << "Best Perf: " << best_ave_time << " ms, " << best_tflops << " TFlops, " std::cout << "Best Perf: " << best_ave_time << " ms, " << best_tflops << " TFlops, "
<< best_gb_per_sec << " GB/s, " << best_gemm_name << std::endl; << best_gb_per_sec << " GB/s, " << best_gemm_name << std::endl;
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment