Commit e8c19535 authored by aska-0096
Browse files

update preprocess number for mi308; bring back printout in ckprofiler

parent 47294b4b
......@@ -351,7 +351,10 @@ float launch_and_time_kernel_with_preprocess(const StreamConfig& stream_config,
}
#else
// return total_time / nrepeat;
return (total_time - 0.01 * nrepeat) / nrepeat;
hipDeviceProp_t deviceProps;
hip_check_error(hipGetDeviceProperties(&deviceProps, 0));
float preprocess_offset = deviceProps.multiProcessorCount==80? 0.005 : 0.01;
return (total_time - preprocess_offset * nrepeat) / nrepeat;
#endif
}
else
......
......@@ -267,9 +267,9 @@ bool profile_gemm_multiply_multiply_impl(int do_verification,
float gb_per_sec = num_btype / 1.E6 / ave_time;
// std::cout << "Perf: " << std::setw(10) << ave_time << " ms, " << tflops
// << " TFlops, " << gb_per_sec << " GB/s, " << op_name << ", KBatch "
// << kbatch_curr << std::endl;
std::cout << "Perf: " << std::setw(10) << ave_time << " ms, " << tflops
<< " TFlops, " << gb_per_sec << " GB/s, " << op_name << ", KBatch "
<< kbatch_curr << std::endl;
#if defined CK_ENABLE_FP8 || defined CK_ENABLE_INT8
// set softer tolerances for fp8
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment