clang-format-12

1670bba9 · chenjun · 09852d3b · 1670bba9 · 1670bba9 · 1670bba9
Commit 1670bba9 authored Oct 21, 2024 by chenjun
5 changed files
--- a/include/ck/host_utility/flush_cache.hpp
+++ b/include/ck/host_utility/flush_cache.hpp
@@ -307,15 +307,15 @@ float launch_and_time_kernel_with_preprocess(const StreamConfig& stream_config,
            hip_check_error(hipGetLastError());
            // end real kernel

-//             hip_check_error(hipEventRecord(stop, stream_config.stream_id_));
-//             hip_check_error(hipEventSynchronize(stop));
-//             float cur_time = 0;
-//             hip_check_error(hipEventElapsedTime(&cur_time, start, stop));
-// #if MEDIAN
-//             times.insert(cur_time);
-// #else
-//             total_time += cur_time;
-// #endif
+            //             hip_check_error(hipEventRecord(stop, stream_config.stream_id_));
+            //             hip_check_error(hipEventSynchronize(stop));
+            //             float cur_time = 0;
+            //             hip_check_error(hipEventElapsedTime(&cur_time, start, stop));
+            // #if MEDIAN
+            //             times.insert(cur_time);
+            // #else
+            //             total_time += cur_time;
+            // #endif

            if(ck::EnvIsEnabled(CK_ENV(CK_LOGGING)))
            {
@@ -351,7 +351,7 @@ float launch_and_time_kernel_with_preprocess(const StreamConfig& stream_config,
        }
 #else
        // return total_time / nrepeat;
-        return (total_time - 0.01*nrepeat) / nrepeat;
+        return (total_time - 0.01 * nrepeat) / nrepeat;
 #endif
    }
    else

--- a/include/ck/tensor_operation/gpu/element/element_wise_operation.hpp
+++ b/include/ck/tensor_operation/gpu/element/element_wise_operation.hpp
@@ -277,7 +277,8 @@ struct MultiplyMultiply
    __host__ __device__ constexpr void operator()<ck::half_t, int, ck::half_t, ck::half_t>(
        ck::half_t& e, const int& c, const ck::half_t& d0, const ck::half_t& d1) const
    {
-        const float x0_f = ck::type_convert<float>(c) * ck::type_convert<float>(d0) * ck::type_convert<float>(d1);
+        const float x0_f =
+            ck::type_convert<float>(c) * ck::type_convert<float>(d0) * ck::type_convert<float>(d1);

        e = ck::type_convert<ck::half_t>(x0_f);
    }
@@ -286,7 +287,8 @@ struct MultiplyMultiply
    __host__ __device__ constexpr void operator()<ck::bhalf_t, int, float, float>(
        ck::bhalf_t& e, const int& c, const float& d0, const float& d1) const
    {
-        const float x0_f = ck::type_convert<float>(c) * ck::type_convert<float>(d0) * ck::type_convert<float>(d1);
+        const float x0_f =
+            ck::type_convert<float>(c) * ck::type_convert<float>(d0) * ck::type_convert<float>(d1);

        e = ck::type_convert<ck::bhalf_t>(x0_f);
    }

--- a/include/ck/utility/amd_xdlops.hpp
+++ b/include/ck/utility/amd_xdlops.hpp
--- a/library/src/tensor_operation_instance/gpu/gemm_multiply_multiply/device_gemm_multiply_multiply_xdl_i8_i8_bf16/device_gemm_multiply_multiply_xdl_i8_i8_bf16_mk_nk_mn.hpp
+++ b/library/src/tensor_operation_instance/gpu/gemm_multiply_multiply/device_gemm_multiply_multiply_xdl_i8_i8_bf16/device_gemm_multiply_multiply_xdl_i8_i8_bf16_mk_nk_mn.hpp
--- a/profiler/include/profiler/profile_gemm_multiply_multiply_impl.hpp
+++ b/profiler/include/profiler/profile_gemm_multiply_multiply_impl.hpp
@@ -274,8 +274,9 @@ bool profile_gemm_multiply_multiply_impl(int do_verification,
 #if defined CK_ENABLE_FP8 || defined CK_ENABLE_INT8
                // set softer tolerances for fp8
                if constexpr((is_same_v<ADataType, f8_t> || is_same_v<BDataType, f8_t> ||
-                             is_same_v<EDataType, f8_t>) || (is_same_v<ADataType, int8_t> ||
-                             is_same_v<BDataType, int8_t>  || is_same_v<EDataType, int8_t>))
+                              is_same_v<EDataType, f8_t>) ||
+                             (is_same_v<ADataType, int8_t> || is_same_v<BDataType, int8_t> ||
+                              is_same_v<EDataType, int8_t>))
                {
                    std::string msg = "Error: Incorrect results!";
                    double rtol     = 1e-1;