Commit e8c19535 authored by aska-0096
Browse files

Update the preprocess timing offset for MI308; restore the performance printout in ckProfiler

parent 47294b4b
...@@ -351,7 +351,10 @@ float launch_and_time_kernel_with_preprocess(const StreamConfig& stream_config, ...@@ -351,7 +351,10 @@ float launch_and_time_kernel_with_preprocess(const StreamConfig& stream_config,
} }
#else #else
// return total_time / nrepeat; // return total_time / nrepeat;
return (total_time - 0.01 * nrepeat) / nrepeat; hipDeviceProp_t deviceProps;
hip_check_error(hipGetDeviceProperties(&deviceProps, 0));
float preprocess_offset = deviceProps.multiProcessorCount==80? 0.005 : 0.01;
return (total_time - preprocess_offset * nrepeat) / nrepeat;
#endif #endif
} }
else else
......
...@@ -267,9 +267,9 @@ bool profile_gemm_multiply_multiply_impl(int do_verification, ...@@ -267,9 +267,9 @@ bool profile_gemm_multiply_multiply_impl(int do_verification,
float gb_per_sec = num_btype / 1.E6 / ave_time; float gb_per_sec = num_btype / 1.E6 / ave_time;
// std::cout << "Perf: " << std::setw(10) << ave_time << " ms, " << tflops std::cout << "Perf: " << std::setw(10) << ave_time << " ms, " << tflops
// << " TFlops, " << gb_per_sec << " GB/s, " << op_name << ", KBatch " << " TFlops, " << gb_per_sec << " GB/s, " << op_name << ", KBatch "
// << kbatch_curr << std::endl; << kbatch_curr << std::endl;
#if defined CK_ENABLE_FP8 || defined CK_ENABLE_INT8 #if defined CK_ENABLE_FP8 || defined CK_ENABLE_INT8
// set softer tolerances for fp8 // set softer tolerances for fp8
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment