Undo some changes

65a0dafd · Umang Yadav · 0e97ebaa · 65a0dafd · 65a0dafd · 65a0dafd
Commit 65a0dafd authored Sep 29, 2023 by Umang Yadav
8 changed files
--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_bwd_weight_xdl_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_bwd_weight_xdl_cshuffle.hpp
@@ -1442,9 +1442,8 @@ struct DeviceGroupedConvBwdWeight_Xdl_CShuffle
                        out_element_op,
                        split_k};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument>
    MakeArgumentPointer(const void* p_in_grid,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_dl_multiple_d_nhwc_kyxc_nhwk.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_dl_multiple_d_nhwc_kyxc_nhwk.hpp
@@ -2,16 +2,12 @@
 // Copyright (c) 2018-2023, Advanced Micro Devices, Inc. All rights reserved.
 #pragma once
-#ifndef __HIPCC_RTC__
 #include <functional>
 #include <iostream>
 #include <iterator>
 #include <numeric>
 #include <sstream>
-#include "ck/host_utility/device_prop.hpp"
-#include "ck/host_utility/kernel_launch.hpp"
-#include "ck/host_utility/io.hpp"
-#endif
 #include "ck/utility/common_header.hpp"
 #include "ck/tensor_description/tensor_descriptor.hpp"
@@ -23,6 +19,9 @@
 #include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
 #include "ck/tensor_operation/gpu/device/matrix_padder.hpp"
 #include "ck/tensor_operation/gpu/grid/gridwise_gemm_dl_multiple_d.hpp"
+#include "ck/host_utility/device_prop.hpp"
+#include "ck/host_utility/kernel_launch.hpp"
+#include "ck/host_utility/io.hpp"
 namespace ck {
 namespace tensor_operation {
@@ -544,7 +543,7 @@ struct DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK
                block_2_ctile_map_ = GridwiseGemm::MakeDefaultBlock2CTileMap(e_grid_desc_m_n_);
            }
        }
-#ifndef __HIPCC_RTC__
        void Print() const
        {
            std::cout << "A[K0, M, K1]: " << a_grid_desc_ak0_m_ak1_ << std::endl;
@@ -557,7 +556,6 @@ struct DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK
            std::cout << "A[m0, m10, m11, n0, n10, n11]: " << e_grid_desc_m0_m10_m11_n0_n10_n11_
                      << std::endl;
        }
-#endif
        //  private:
        // pointers
@@ -706,7 +704,7 @@ struct DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK
            return Run(*dynamic_cast<const Argument*>(p_arg), stream_config);
        }
    };
-#ifndef __HIPCC_RTC__
    static bool IsSupportedArgument(const Argument& arg)
    {
        namespace ctc = tensor_layout::convolution;
@@ -851,7 +849,7 @@ struct DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK
    {
        return IsSupportedArgument(*dynamic_cast<const Argument*>(p_arg));
    }
-#endif
    static auto MakeArgument(
        const void* p_a,
        const void* p_b,
@@ -893,9 +891,9 @@ struct DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK
                        b_element_op,
                        cde_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument> MakeArgumentPointer(
        const void* p_a,
        const void* p_b,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_dl_nhwc_kyxc_nhwk.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_dl_nhwc_kyxc_nhwk.hpp
@@ -595,7 +595,7 @@ struct DeviceGroupedConvFwdDl_NHWC_KYXC_NHWK : public DeviceGroupedConvFwd<NDimS
            return Run(*dynamic_cast<const Argument*>(p_arg), stream_config);
        }
    };
-#ifndef __HIPCC_RTC__
    static bool IsSupportedArgument(const Argument& arg)
    {
        namespace ctc = tensor_layout::convolution;
@@ -737,7 +737,7 @@ struct DeviceGroupedConvFwdDl_NHWC_KYXC_NHWK : public DeviceGroupedConvFwd<NDimS
    {
        return IsSupportedArgument(*dynamic_cast<const Argument*>(p_arg));
    }
-#endif
    static auto MakeArgument(const void* p_a,
                             const void* p_b,
                             void* p_c,
@@ -773,9 +773,7 @@ struct DeviceGroupedConvFwdDl_NHWC_KYXC_NHWK : public DeviceGroupedConvFwd<NDimS
                        c_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument>
    MakeArgumentPointer(const void* p_a,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_multiple_r_xdl_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_multiple_r_xdl_cshuffle.hpp
@@ -1025,9 +1025,8 @@ struct DeviceGroupedConvFwdMultipleDMultipleR_Xdl_CShuffle
                        qs_element_op,
                        rs_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument> MakeArgumentPointer(
        const void* p_a,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_wmma_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_wmma_cshuffle.hpp
@@ -775,9 +775,8 @@ struct DeviceGroupedConvFwdMultipleD_Wmma_CShuffle
                        b_element_op,
                        cde_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument> MakeArgumentPointer(
        const void* p_a,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_xdl_cshuffle.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_conv_fwd_multiple_d_xdl_cshuffle.hpp
@@ -884,9 +884,8 @@ struct DeviceGroupedConvFwdMultipleD_Xdl_CShuffle
                        b_element_op,
                        cde_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    std::unique_ptr<BaseArgument> MakeArgumentPointer(
        const void* p_a,

--- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp
+++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp
@@ -708,9 +708,8 @@ struct DeviceGroupedGemmMultipleD_Dl : public DeviceGroupedGemm<ALayout,
        return Argument{
            p_As, p_Bs, p_Ds, p_Es, gemm_descs, a_element_op, b_element_op, cde_element_op};
    }
-#ifndef __HIPCC_RTC__
    static auto MakeInvoker() { return Invoker{}; }
-#endif
    // polymorphic
    std::unique_ptr<BaseArgument>

--- a/include/ck/tensor_operation/gpu/grid/gridwise_gemm_pipeline_selector.hpp
+++ b/include/ck/tensor_operation/gpu/grid/gridwise_gemm_pipeline_selector.hpp
@@ -39,7 +39,9 @@ constexpr auto GridwiseGemmPipeline_Selector()
    }
    else
    {
-        // std::cerr << "GridwiseGemmPipeline configuration is not available" << std::endl;
+#ifndef __HIPCC_RTC__
+        std::cerr << "GridwiseGemmPipeline configuration is not available" << std::endl;
+#endif
    }
 }