Commit d9ce3a57 authored by Po-Yen, Chen
Browse files

Fix format

parent b5f11e02
......@@ -29,8 +29,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_default_pipeline_v1_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[k, m] * b[k, n] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -31,8 +31,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_default_pipeline_v2_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[k, m] * b[k, n] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_INTER_WAVE_INSTANCES
// pipeline v1, 2 waves
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -31,8 +31,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_interwave_pipeline_v1_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -21,8 +21,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_irregular_default_pipeline_v1_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -10,7 +10,7 @@ namespace instance {
// irregular tile size
using Instances = std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//###########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -23,8 +23,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_irregular_default_pipeline_v2_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -10,7 +10,7 @@ namespace instance {
// irregular tile size
using Instances = std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_INTER_WAVE_INSTANCES
// pipeline v1, 2 waves
//###########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -23,8 +23,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_kn_mn_irregular_interwave_pipeline_v1_instances(
OwnerList<InstanceNT>&
instances)
OwnerList<InstanceNT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -29,8 +29,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_default_pipeline_v1_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[k, m] * b[n, k] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -31,8 +31,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_default_pipeline_v2_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[k, m] * b[n, k] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_INTER_WAVE_INSTANCES
// pipeline v1, 2 waves
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -31,8 +31,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_interwave_pipeline_v1_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -21,8 +21,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_irregular_default_pipeline_v1_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -10,7 +10,7 @@ namespace instance {
// irregular tile size
using Instances = std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//###########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -23,8 +23,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_irregular_default_pipeline_v2_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -10,7 +10,7 @@ namespace instance {
// irregular tile size
using Instances = std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_INTER_WAVE_INSTANCES
// pipeline v1, 2 waves
//###########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -23,8 +23,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_km_nk_mn_irregular_interwave_pipeline_v1_instances(
OwnerList<InstanceNN>&
instances)
OwnerList<InstanceNN>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -38,8 +38,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_mk_kn_mn_default_pipeline_v1_instances(
OwnerList<InstanceTT>&
instances)
OwnerList<InstanceTT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[m, k] * b[k, n] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -40,8 +40,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_mk_kn_mn_default_pipeline_v2_instances(
OwnerList<InstanceTT>&
instances)
OwnerList<InstanceTT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -11,7 +11,7 @@ namespace instance {
// Compilation parameters for a[m, k] * b[k, n] = c[m, n]
using Instances =
std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_INTER_WAVE_INSTANCES
// pipeline v1, 2 waves
//##########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -40,8 +40,7 @@ using Instances =
>;
void add_device_gemm_xdl_f16_f16_f16_mk_kn_mn_interwave_pipeline_v1_instances(
OwnerList<InstanceTT>&
instances)
OwnerList<InstanceTT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -21,8 +21,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_mk_kn_mn_irregular_default_pipeline_v1_instances(
OwnerList<InstanceTT>&
instances)
OwnerList<InstanceTT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
......@@ -10,7 +10,7 @@ namespace instance {
// irregular tile size
using Instances = std::tuple<
// clang-format off
// clang-format off
#if CK_EXPERIMENTAL_PIPELINE_V2_INSTANCES
// pipeline v2, 1 wave
//###########| AData| BData| CData| AccData| ALayout| BLayout| CLayout| A| B| C| GEMM| Block| MPer| NPer| K0Per| K1| MPer| NPer| MXdl| NXdl| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockTransfer| ABlockLds| BBlockTransfer| BBlockTransfer| BBlockTransfer| BlockTransfer| BBlockTransfer| BBlockTransfer| BBlockLds| CThreadTransfer| CThreadTransfer| NumPrefetch| LoopScheduler| Pipeline|
......@@ -23,8 +23,7 @@ using Instances = std::tuple<
>;
void add_device_gemm_xdl_f16_f16_f16_mk_kn_mn_irregular_default_pipeline_v2_instances(
OwnerList<InstanceTT>&
instances)
OwnerList<InstanceTT>& instances)
{
add_device_operation_instances(instances, Instances{});
}
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment