Commit 629257f9 authored by rocking
Browse files

Remove fp32 instances

parent ba5d34aa
...@@ -9,7 +9,7 @@ auto create_args(int argc, char* argv[]) ...@@ -9,7 +9,7 @@ auto create_args(int argc, char* argv[])
.insert("n", "4096", "m dimension") .insert("n", "4096", "m dimension")
.insert("e", "1e-5", "epsilon") .insert("e", "1e-5", "epsilon")
.insert("v", "1", "cpu validation or not") .insert("v", "1", "cpu validation or not")
.insert("prec", "fp32", "precision") .insert("prec", "fp16", "precision")
.insert("warmup", "5", "cold iter") .insert("warmup", "5", "cold iter")
.insert("repeat", "20", "hot iter"); .insert("repeat", "20", "hot iter");
......
...@@ -7,6 +7,7 @@ ...@@ -7,6 +7,7 @@
#include "layernorm_dispatch.hpp" #include "layernorm_dispatch.hpp"
// clang-format off // clang-format off
#ifdef CK_TILE_LAYERNORM2D_FWD_FP32_DEFAULT
template float run_layernorm<float, 1, 32, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 1, 32, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 1, 64, 2, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 1, 64, 2, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 1, 64, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 1, 64, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
...@@ -31,4 +32,5 @@ template float run_layernorm<float, 8, 64, 4, true>(const layernorm2d_fwd_args& ...@@ -31,4 +32,5 @@ template float run_layernorm<float, 8, 64, 4, true>(const layernorm2d_fwd_args&
template float run_layernorm<float, 16, 64, 2, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 16, 64, 2, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 8, 64, 4, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 8, 64, 4, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 16, 64, 2, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream); template float run_layernorm<float, 16, 64, 2, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
#endif
// clang-format on // clang-format on
...@@ -112,6 +112,7 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t, ...@@ -112,6 +112,7 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t,
} }
} }
} }
#ifdef CK_TILE_LAYERNORM2D_FWD_FP32_DEFAULT
else if(t.data_type.compare("fp32") == 0) else if(t.data_type.compare("fp32") == 0)
{ {
if(a.N % 4 == 0) if(a.N % 4 == 0)
...@@ -181,6 +182,10 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t, ...@@ -181,6 +182,10 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t,
} }
} }
} }
#endif
if (r < 0)
throw std::runtime_error("Without supported instances!");
return r; return r;
} }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment