Merge commit '30480288' into conv_quant_int8

f0f943ff · rocking · 48c85879 · 30480288 · f0f943ff · f0f943ff
Commit f0f943ff authored Oct 14, 2022 by rocking
5 changed files
--- a/test/batched_gemm_softmax_gemm/test_batched_gemm_softmax_gemm_util.hpp
+++ b/test/batched_gemm_softmax_gemm/test_batched_gemm_softmax_gemm_util.hpp
@@ -5,7 +5,7 @@

 #include <vector>
 #include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
-#include "ck/tensor_operation/gpu/device/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp"
+#include "ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp"
 #include "profiler/include/profile_batched_gemm_softmax_gemm_impl.hpp"
 using ck::tensor_operation::device::GemmSpecialization;


--- a/test/convnd_bwd_data/convnd_bwd_data.cpp
+++ b/test/convnd_bwd_data/convnd_bwd_data.cpp
@@ -5,237 +5,89 @@
 #include <iostream>
 #include <initializer_list>
 #include <vector>
+#include <tuple>
 #include <gtest/gtest.h>

 #include "profiler/include/profile_conv_bwd_data_impl.hpp"

+template <typename Tuple>
 class TestConvndBwdData : public ::testing::Test
 {
    protected:
+    using DataType = std::tuple_element_t<0, Tuple>;
    std::vector<ck::utils::conv::ConvParam> conv_params;
-};

-// 1d
-TEST_F(TestConvndBwdData, Conv1dBwdData)
-{
-    conv_params.clear();
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
-    conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
-
-    for(auto& param : conv_params)
+    template <ck::index_t NDimSpatial>
+    void Run()
    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_data_impl<1,
-                                                        ck::tensor_layout::convolution::NWC,
-                                                        ck::tensor_layout::convolution::KXC,
-                                                        ck::tensor_layout::convolution::NWK,
-                                                        float,
-                                                        float,
-                                                        float>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_data_impl<1,
-                                                        ck::tensor_layout::convolution::NWC,
-                                                        ck::tensor_layout::convolution::KXC,
-                                                        ck::tensor_layout::convolution::NWK,
-                                                        ck::half_t,
-                                                        ck::half_t,
-                                                        ck::half_t>(true,  // do_verification
-                                                                    1,     // init_method
-                                                                    false, // do_log
-                                                                    false, // time_kernel
-                                                                    param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_bwd_data_impl<1,
-                                                        ck::tensor_layout::convolution::NWC,
-                                                        ck::tensor_layout::convolution::KXC,
-                                                        ck::tensor_layout::convolution::NWK,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t>(true,  // do_verification
-                                                                     1,     // init_method
-                                                                     false, // do_log
-                                                                     false, // time_kernel
-                                                                     param);
-
-        EXPECT_TRUE(pass);
+        for(auto& param : conv_params)
+        {
+            bool pass;
+            EXPECT_FALSE(conv_params.empty());
+            pass = ck::profiler::profile_conv_bwd_data_impl<
+                NDimSpatial,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWC,
+                                              ck::tensor_layout::convolution::NHWC,
+                                              ck::tensor_layout::convolution::NDHWC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::KXC,
+                                              ck::tensor_layout::convolution::KYXC,
+                                              ck::tensor_layout::convolution::KZYXC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWK,
+                                              ck::tensor_layout::convolution::NHWK,
+                                              ck::tensor_layout::convolution::NDHWK>>,
+                DataType,
+                DataType,
+                DataType>(true,  // do_verification
+                          1,     // init_method integer value
+                          false, // do_log
+                          false, // time_kernel
+                          param);
+            EXPECT_TRUE(pass);
+        }
+    }
+};

-        // int8
-        pass = ck::profiler::profile_conv_bwd_data_impl<1,
-                                                        ck::tensor_layout::convolution::NWC,
-                                                        ck::tensor_layout::convolution::KXC,
-                                                        ck::tensor_layout::convolution::NWK,
-                                                        int8_t,
-                                                        int8_t,
-                                                        int8_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
+using KernelTypes = ::testing::Types<std::tuple<float>,
+                                     std::tuple<ck::half_t>,
+                                     std::tuple<ck::bhalf_t>,
+                                     std::tuple<std::int8_t>>;
+TYPED_TEST_SUITE(TestConvndBwdData, KernelTypes);

-        EXPECT_TRUE(pass);
-    }
+// 1d
+TYPED_TEST(TestConvndBwdData, Conv1dBwdData)
+{
+    this->conv_params.clear();
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
+    this->template Run<1>();
 }

 // 2d
-TEST_F(TestConvndBwdData, Conv2dBwdData)
+TYPED_TEST(TestConvndBwdData, Conv2dBwdData)
 {
-    conv_params.clear();
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
-    conv_params.push_back({2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_data_impl<2,
-                                                        ck::tensor_layout::convolution::NHWC,
-                                                        ck::tensor_layout::convolution::KYXC,
-                                                        ck::tensor_layout::convolution::NHWK,
-                                                        float,
-                                                        float,
-                                                        float>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_data_impl<2,
-                                                        ck::tensor_layout::convolution::NHWC,
-                                                        ck::tensor_layout::convolution::KYXC,
-                                                        ck::tensor_layout::convolution::NHWK,
-                                                        ck::half_t,
-                                                        ck::half_t,
-                                                        ck::half_t>(true,  // do_verification
-                                                                    1,     // init_method
-                                                                    false, // do_log
-                                                                    false, // time_kernel
-                                                                    param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_bwd_data_impl<2,
-                                                        ck::tensor_layout::convolution::NHWC,
-                                                        ck::tensor_layout::convolution::KYXC,
-                                                        ck::tensor_layout::convolution::NHWK,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t>(true,  // do_verification
-                                                                     1,     // init_method
-                                                                     false, // do_log
-                                                                     false, // time_kernel
-                                                                     param);
-
-        EXPECT_TRUE(pass);
-
-        // int8
-        pass = ck::profiler::profile_conv_bwd_data_impl<2,
-                                                        ck::tensor_layout::convolution::NHWC,
-                                                        ck::tensor_layout::convolution::KYXC,
-                                                        ck::tensor_layout::convolution::NHWK,
-                                                        int8_t,
-                                                        int8_t,
-                                                        int8_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
-
-        EXPECT_TRUE(pass);
-    }
+    this->conv_params.clear();
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
+    this->template Run<2>();
 }

 // 3d
-TEST_F(TestConvndBwdData, Conv3dBwdData)
+TYPED_TEST(TestConvndBwdData, Conv3dBwdData)
 {
-    conv_params.clear();
-    conv_params.push_back(
+    this->conv_params.clear();
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_data_impl<3,
-                                                        ck::tensor_layout::convolution::NDHWC,
-                                                        ck::tensor_layout::convolution::KZYXC,
-                                                        ck::tensor_layout::convolution::NDHWK,
-                                                        float,
-                                                        float,
-                                                        float>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_data_impl<3,
-                                                        ck::tensor_layout::convolution::NDHWC,
-                                                        ck::tensor_layout::convolution::KZYXC,
-                                                        ck::tensor_layout::convolution::NDHWK,
-                                                        ck::half_t,
-                                                        ck::half_t,
-                                                        ck::half_t>(true,  // do_verification
-                                                                    1,     // init_method
-                                                                    false, // do_log
-                                                                    false, // time_kernel
-                                                                    param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_bwd_data_impl<3,
-                                                        ck::tensor_layout::convolution::NDHWC,
-                                                        ck::tensor_layout::convolution::KZYXC,
-                                                        ck::tensor_layout::convolution::NDHWK,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t,
-                                                        ck::bhalf_t>(true,  // do_verification
-                                                                     1,     // init_method
-                                                                     false, // do_log
-                                                                     false, // time_kernel
-                                                                     param);
-
-        EXPECT_TRUE(pass);
-
-        // int8
-        pass = ck::profiler::profile_conv_bwd_data_impl<3,
-                                                        ck::tensor_layout::convolution::NDHWC,
-                                                        ck::tensor_layout::convolution::KZYXC,
-                                                        ck::tensor_layout::convolution::NDHWK,
-                                                        int8_t,
-                                                        int8_t,
-                                                        int8_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
-
-        EXPECT_TRUE(pass);
-    }
+    this->template Run<3>();
 }
--- a/test/convnd_bwd_weight/convnd_bwd_weight.cpp
+++ b/test/convnd_bwd_weight/convnd_bwd_weight.cpp
@@ -5,201 +5,86 @@
 #include <iostream>
 #include <initializer_list>
 #include <vector>
+#include <tuple>
 #include <gtest/gtest.h>

 #include "profiler/include/profile_conv_bwd_weight_impl.hpp"

+template <typename Tuple>
 class TestConvndBwdWeight : public ::testing::Test
 {
    protected:
+    using DataType = std::tuple_element_t<0, Tuple>;
    std::vector<ck::utils::conv::ConvParam> conv_params;
-};
-
-// 1d
-TEST_F(TestConvndBwdWeight, Conv1dBwdWeight)
-{
-    conv_params.clear();
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
-    conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
+    ck::index_t split_k{2};

-    for(auto& param : conv_params)
+    template <ck::index_t NDimSpatial>
+    void Run()
    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_weight_impl<1,
-                                                          ck::tensor_layout::convolution::NWC,
-                                                          ck::tensor_layout::convolution::KXC,
-                                                          ck::tensor_layout::convolution::NWK,
-                                                          float,
-                                                          float,
-                                                          float>(true,  // do_verification
-                                                                 1,     // init_method
-                                                                 false, // do_log
-                                                                 false, // time_kernel
-                                                                 param,
-                                                                 2);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<1,
-                                                          ck::tensor_layout::convolution::NWC,
-                                                          ck::tensor_layout::convolution::KXC,
-                                                          ck::tensor_layout::convolution::NWK,
-                                                          ck::half_t,
-                                                          ck::half_t,
-                                                          ck::half_t>(true,  // do_verification
-                                                                      1,     // init_method
-                                                                      false, // do_log
-                                                                      false, // time_kernel
-                                                                      param,
-                                                                      2);
-
-        EXPECT_TRUE(pass);
+        for(auto& param : conv_params)
+        {
+            bool pass;
+            EXPECT_FALSE(conv_params.empty());
+            pass = ck::profiler::profile_conv_bwd_weight_impl<
+                NDimSpatial,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWC,
+                                              ck::tensor_layout::convolution::NHWC,
+                                              ck::tensor_layout::convolution::NDHWC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::KXC,
+                                              ck::tensor_layout::convolution::KYXC,
+                                              ck::tensor_layout::convolution::KZYXC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWK,
+                                              ck::tensor_layout::convolution::NHWK,
+                                              ck::tensor_layout::convolution::NDHWK>>,
+                DataType,
+                DataType,
+                DataType>(true,  // do_verification
+                          1,     // init_method integer value
+                          false, // do_log
+                          false, // time_kernel
+                          param,
+                          split_k);
+            EXPECT_TRUE(pass);
+        }
+    }
+};

-        // bf16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<1,
-                                                          ck::tensor_layout::convolution::NWC,
-                                                          ck::tensor_layout::convolution::KXC,
-                                                          ck::tensor_layout::convolution::NWK,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t>(true,  // do_verification
-                                                                       1,     // init_method
-                                                                       false, // do_log
-                                                                       false, // time_kernel
-                                                                       param,
-                                                                       2);
+using KernelTypes =
+    ::testing::Types<std::tuple<float>, std::tuple<ck::half_t>, std::tuple<ck::bhalf_t>>;
+TYPED_TEST_SUITE(TestConvndBwdWeight, KernelTypes);

-        EXPECT_TRUE(pass);
-    }
+TYPED_TEST(TestConvndBwdWeight, Test1D)
+{
+    this->conv_params.clear();
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
+    this->template Run<1>();
 }

-// 2d
-TEST_F(TestConvndBwdWeight, Conv2dBwdWeight)
+TYPED_TEST(TestConvndBwdWeight, Test2D)
 {
-    conv_params.clear();
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
-    conv_params.push_back({2, 1, 32, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_weight_impl<2,
-                                                          ck::tensor_layout::convolution::NHWC,
-                                                          ck::tensor_layout::convolution::KYXC,
-                                                          ck::tensor_layout::convolution::NHWK,
-                                                          float,
-                                                          float,
-                                                          float>(true,  // do_verification
-                                                                 1,     // init_method
-                                                                 false, // do_log
-                                                                 false, // time_kernel
-                                                                 param,
-                                                                 2);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<2,
-                                                          ck::tensor_layout::convolution::NHWC,
-                                                          ck::tensor_layout::convolution::KYXC,
-                                                          ck::tensor_layout::convolution::NHWK,
-                                                          ck::half_t,
-                                                          ck::half_t,
-                                                          ck::half_t>(true,  // do_verification
-                                                                      1,     // init_method
-                                                                      false, // do_log
-                                                                      false, // time_kernel
-                                                                      param,
-                                                                      2);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<2,
-                                                          ck::tensor_layout::convolution::NHWC,
-                                                          ck::tensor_layout::convolution::KYXC,
-                                                          ck::tensor_layout::convolution::NHWK,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t>(true,  // do_verification
-                                                                       1,     // init_method
-                                                                       false, // do_log
-                                                                       false, // time_kernel
-                                                                       param,
-                                                                       2);
-
-        EXPECT_TRUE(pass);
-    }
+    this->conv_params.clear();
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
+    this->conv_params.push_back(
+        {2, 1, 32, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
+    this->template Run<2>();
 }

-// 3d
-TEST_F(TestConvndBwdWeight, Conv3dBwdWeight)
+TYPED_TEST(TestConvndBwdWeight, Test3D)
 {
-    conv_params.clear();
-    conv_params.push_back(
+    this->conv_params.clear();
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 32, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_bwd_weight_impl<3,
-                                                          ck::tensor_layout::convolution::NDHWC,
-                                                          ck::tensor_layout::convolution::KZYXC,
-                                                          ck::tensor_layout::convolution::NDHWK,
-                                                          float,
-                                                          float,
-                                                          float>(true,  // do_verification
-                                                                 1,     // init_method
-                                                                 false, // do_log
-                                                                 false, // time_kernel
-                                                                 param,
-                                                                 2);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<3,
-                                                          ck::tensor_layout::convolution::NDHWC,
-                                                          ck::tensor_layout::convolution::KZYXC,
-                                                          ck::tensor_layout::convolution::NDHWK,
-                                                          ck::half_t,
-                                                          ck::half_t,
-                                                          ck::half_t>(true,  // do_verification
-                                                                      1,     // init_method
-                                                                      false, // do_log
-                                                                      false, // time_kernel
-                                                                      param,
-                                                                      2);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_bwd_weight_impl<3,
-                                                          ck::tensor_layout::convolution::NDHWC,
-                                                          ck::tensor_layout::convolution::KZYXC,
-                                                          ck::tensor_layout::convolution::NDHWK,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t,
-                                                          ck::bhalf_t>(true,  // do_verification
-                                                                       1,     // init_method
-                                                                       false, // do_log
-                                                                       false, // time_kernel
-                                                                       param,
-                                                                       2);
-
-        EXPECT_TRUE(pass);
-    }
+    this->template Run<3>();
 }
--- a/test/convnd_fwd/convnd_fwd.cpp
+++ b/test/convnd_fwd/convnd_fwd.cpp
@@ -5,237 +5,88 @@
 #include <iostream>
 #include <initializer_list>
 #include <vector>
+#include <tuple>
 #include <gtest/gtest.h>

 #include "profiler/include/profile_conv_fwd_impl.hpp"

+template <typename Tuple>
 class TestConvndFwd : public ::testing::Test
 {
    protected:
+    using DataType = std::tuple_element_t<0, Tuple>;
    std::vector<ck::utils::conv::ConvParam> conv_params;
-};

-// 1d
-TEST_F(TestConvndFwd, Conv1dFwd)
-{
-    conv_params.clear();
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
-    conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
-    conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
-
-    for(auto& param : conv_params)
+    template <ck::index_t NDimSpatial>
+    void Run()
    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_fwd_impl<1,
-                                                   ck::tensor_layout::convolution::NWC,
-                                                   ck::tensor_layout::convolution::KXC,
-                                                   ck::tensor_layout::convolution::NWK,
-                                                   float,
-                                                   float,
-                                                   float>(true,  // do_verification
-                                                          1,     // init_method
-                                                          false, // do_log
-                                                          false, // time_kernel
-                                                          param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_fwd_impl<1,
-                                                   ck::tensor_layout::convolution::NWC,
-                                                   ck::tensor_layout::convolution::KXC,
-                                                   ck::tensor_layout::convolution::NWK,
-                                                   ck::half_t,
-                                                   ck::half_t,
-                                                   ck::half_t>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_fwd_impl<1,
-                                                   ck::tensor_layout::convolution::NWC,
-                                                   ck::tensor_layout::convolution::KXC,
-                                                   ck::tensor_layout::convolution::NWK,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
-
-        EXPECT_TRUE(pass);
+        for(auto& param : conv_params)
+        {
+            bool pass;
+            EXPECT_FALSE(conv_params.empty());
+            pass = ck::profiler::profile_conv_fwd_impl<
+                NDimSpatial,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWC,
+                                              ck::tensor_layout::convolution::NHWC,
+                                              ck::tensor_layout::convolution::NDHWC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::KXC,
+                                              ck::tensor_layout::convolution::KYXC,
+                                              ck::tensor_layout::convolution::KZYXC>>,
+                ck::tuple_element_t<NDimSpatial - 1,
+                                    ck::Tuple<ck::tensor_layout::convolution::NWK,
+                                              ck::tensor_layout::convolution::NHWK,
+                                              ck::tensor_layout::convolution::NDHWK>>,
+                DataType,
+                DataType,
+                DataType>(true,  // do_verification
+                          1,     // init_method integer value
+                          false, // do_log
+                          false, // time_kernel
+                          param);
+            EXPECT_TRUE(pass);
+        }
+    }
+};

-        // int8
-        pass = ck::profiler::profile_conv_fwd_impl<1,
-                                                   ck::tensor_layout::convolution::NWC,
-                                                   ck::tensor_layout::convolution::KXC,
-                                                   ck::tensor_layout::convolution::NWK,
-                                                   int8_t,
-                                                   int8_t,
-                                                   int8_t>(true,  // do_verification
-                                                           1,     // init_method
-                                                           false, // do_log
-                                                           false, // time_kernel
-                                                           param);
+using KernelTypes = ::testing::Types<std::tuple<float>,
+                                     std::tuple<ck::half_t>,
+                                     std::tuple<ck::bhalf_t>,
+                                     std::tuple<std::int8_t>>;
+TYPED_TEST_SUITE(TestConvndFwd, KernelTypes);

-        EXPECT_TRUE(pass);
-    }
+// 1d
+TYPED_TEST(TestConvndFwd, Conv1dFwd)
+{
+    this->conv_params.clear();
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
+    this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
+    this->template Run<1>();
 }

 // 2d
-TEST_F(TestConvndFwd, Conv2dFwd)
+TYPED_TEST(TestConvndFwd, Conv2dFwd)
 {
-    conv_params.clear();
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
-    conv_params.push_back({2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
-    conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_fwd_impl<2,
-                                                   ck::tensor_layout::convolution::NHWC,
-                                                   ck::tensor_layout::convolution::KYXC,
-                                                   ck::tensor_layout::convolution::NHWK,
-                                                   float,
-                                                   float,
-                                                   float>(true,  // do_verification
-                                                          1,     // init_method
-                                                          false, // do_log
-                                                          false, // time_kernel
-                                                          param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_fwd_impl<2,
-                                                   ck::tensor_layout::convolution::NHWC,
-                                                   ck::tensor_layout::convolution::KYXC,
-                                                   ck::tensor_layout::convolution::NHWK,
-                                                   ck::half_t,
-                                                   ck::half_t,
-                                                   ck::half_t>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_fwd_impl<2,
-                                                   ck::tensor_layout::convolution::NHWC,
-                                                   ck::tensor_layout::convolution::KYXC,
-                                                   ck::tensor_layout::convolution::NHWK,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
-
-        EXPECT_TRUE(pass);
-
-        // int8
-        pass = ck::profiler::profile_conv_fwd_impl<2,
-                                                   ck::tensor_layout::convolution::NHWC,
-                                                   ck::tensor_layout::convolution::KYXC,
-                                                   ck::tensor_layout::convolution::NHWK,
-                                                   int8_t,
-                                                   int8_t,
-                                                   int8_t>(true,  // do_verification
-                                                           1,     // init_method
-                                                           false, // do_log
-                                                           false, // time_kernel
-                                                           param);
-
-        EXPECT_TRUE(pass);
-    }
+    this->conv_params.clear();
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
+    this->conv_params.push_back(
+        {2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
+    this->template Run<2>();
 }
-
 // 3d
-TEST_F(TestConvndFwd, Conv3dFwd)
+TYPED_TEST(TestConvndFwd, Conv3dFwd)
 {
-    conv_params.clear();
-    conv_params.push_back(
+    this->conv_params.clear();
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
-    conv_params.push_back(
+    this->conv_params.push_back(
        {3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
-
-    for(auto& param : conv_params)
-    {
-        bool pass;
-
-        // fp32
-        pass = ck::profiler::profile_conv_fwd_impl<3,
-                                                   ck::tensor_layout::convolution::NDHWC,
-                                                   ck::tensor_layout::convolution::KZYXC,
-                                                   ck::tensor_layout::convolution::NDHWK,
-                                                   float,
-                                                   float,
-                                                   float>(true,  // do_verification
-                                                          1,     // init_method
-                                                          false, // do_log
-                                                          false, // time_kernel
-                                                          param);
-
-        EXPECT_TRUE(pass);
-
-        // fp16
-        pass = ck::profiler::profile_conv_fwd_impl<3,
-                                                   ck::tensor_layout::convolution::NDHWC,
-                                                   ck::tensor_layout::convolution::KZYXC,
-                                                   ck::tensor_layout::convolution::NDHWK,
-                                                   ck::half_t,
-                                                   ck::half_t,
-                                                   ck::half_t>(true,  // do_verification
-                                                               1,     // init_method
-                                                               false, // do_log
-                                                               false, // time_kernel
-                                                               param);
-
-        EXPECT_TRUE(pass);
-
-        // bf16
-        pass = ck::profiler::profile_conv_fwd_impl<3,
-                                                   ck::tensor_layout::convolution::NDHWC,
-                                                   ck::tensor_layout::convolution::KZYXC,
-                                                   ck::tensor_layout::convolution::NDHWK,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t,
-                                                   ck::bhalf_t>(true,  // do_verification
-                                                                1,     // init_method
-                                                                false, // do_log
-                                                                false, // time_kernel
-                                                                param);
-
-        EXPECT_TRUE(pass);
-
-        // int8
-        pass = ck::profiler::profile_conv_fwd_impl<3,
-                                                   ck::tensor_layout::convolution::NDHWC,
-                                                   ck::tensor_layout::convolution::KZYXC,
-                                                   ck::tensor_layout::convolution::NDHWK,
-                                                   int8_t,
-                                                   int8_t,
-                                                   int8_t>(true,  // do_verification
-                                                           1,     // init_method
-                                                           false, // do_log
-                                                           false, // time_kernel
-                                                           param);
-
-        EXPECT_TRUE(pass);
-    }
+    this->template Run<3>();
 }
--- a/test/normalization/test_layernorm2d_util.hpp
+++ b/test/normalization/test_layernorm2d_util.hpp
@@ -9,7 +9,7 @@

 #include "ck/ck.hpp"
 #include "ck/utility/number.hpp"
-#include "ck/tensor_operation/gpu/device/device_normalization_impl.hpp"
+#include "ck/tensor_operation/gpu/device/impl/device_normalization_impl.hpp"

 #include "ck/library/utility/check_err.hpp"
 #include "ck/library/utility/host_tensor.hpp"