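Rename __global__ kernel functions from *_gemm_softmax_gemm_xdl_cshuffle_v1 to *_multihead_attention_backward_xdl_cshuffle_v1 (batched and grouped variants)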

2ebc3248 · fsx950223 · 09a717e3 · 2ebc3248 · 2ebc3248
Commit 2ebc3248 authored Jan 13, 2023 by fsx950223
2 changed files
--- a/include/ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp
@@ -42,7 +42,7 @@ __global__ void
 #if CK_USE_LAUNCH_BOUNDS
    __launch_bounds__(CK_MAX_THREAD_PER_BLOCK, CK_MIN_BLOCK_PER_CU)
 #endif
-        kernel_batched_gemm_softmax_gemm_xdl_cshuffle_v1(
+        kernel_batched_multihead_attention_backward_xdl_cshuffle_v1(
            const FloatAB* __restrict__ p_a_grid,
            const FloatAB* __restrict__ p_b_grid,
            const FloatAB* __restrict__ p_b1_grid,
@@ -540,7 +540,7 @@ struct DeviceBatchedGemmSoftmaxGemm_Xdl_CShuffle
            float ave_time = 0;

            auto launch_kernel = [&](auto has_main_k_block_loop_) {
-                const auto kernel = kernel_batched_gemm_softmax_gemm_xdl_cshuffle_v1<
+                const auto kernel = kernel_batched_multihead_attention_backward_xdl_cshuffle_v1<
                    GridwiseGemm,
                    ADataType, // TODO: distiguish A/B datatype
                    CDataType,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_multihead_attention_backward_xdl_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_multihead_attention_backward_xdl_cshuffle.hpp
@@ -38,7 +38,7 @@ __global__ void
 #if CK_USE_LAUNCH_BOUNDS
 __launch_bounds__(CK_MAX_THREAD_PER_BLOCK, CK_MIN_BLOCK_PER_CU)
 #endif
-    kernel_grouped_gemm_softmax_gemm_xdl_cshuffle_v1(
+    kernel_grouped_multihead_attention_backward_xdl_cshuffle_v1(
        const void CK_CONSTANT_ADDRESS_SPACE* group_kernel_args,
        const index_t group_count,
        const AElementwiseOperation a_element_op,
@@ -890,14 +890,14 @@ struct DeviceGroupedMultiheadAttentionBackward_Xdl_CShuffle

            auto launch_kernel = [&](auto has_main_k_block_loop_) {
                const auto kernel =
-                    kernel_grouped_gemm_softmax_gemm_xdl_cshuffle_v1<GridwiseGemm,
-                                                                     GroupKernelArg,
-                                                                     AElementwiseOperation,
-                                                                     BElementwiseOperation,
-                                                                     AccElementwiseOperation,
-                                                                     B1ElementwiseOperation,
-                                                                     CElementwiseOperation,
-                                                                     has_main_k_block_loop_>;
+                    kernel_grouped_multihead_attention_backward_xdl_cshuffle_v1<GridwiseGemm,
+                                                                                GroupKernelArg,
+                                                                                AElementwiseOperation,
+                                                                                BElementwiseOperation,
+                                                                                AccElementwiseOperation,
+                                                                                B1ElementwiseOperation,
+                                                                                CElementwiseOperation,
+                                                                                has_main_k_block_loop_>;

                return launch_and_time_kernel(
                    stream_config,