Commit 629257f9 authored by rocking
Browse files

Remove fp32 instances

parent ba5d34aa
......@@ -9,7 +9,7 @@ auto create_args(int argc, char* argv[])
.insert("n", "4096", "m dimension")
.insert("e", "1e-5", "epsilon")
.insert("v", "1", "cpu validation or not")
.insert("prec", "fp32", "precision")
.insert("prec", "fp16", "precision")
.insert("warmup", "5", "cold iter")
.insert("repeat", "20", "hot iter");
......
......@@ -7,6 +7,7 @@
#include "layernorm_dispatch.hpp"
// clang-format off
#ifdef CK_TILE_LAYERNORM2D_FWD_FP32_DEFAULT
template float run_layernorm<float, 1, 32, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 1, 64, 2, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 1, 64, 4, false>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
......@@ -31,4 +32,5 @@ template float run_layernorm<float, 8, 64, 4, true>(const layernorm2d_fwd_args&
template float run_layernorm<float, 16, 64, 2, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 8, 64, 4, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
template float run_layernorm<float, 16, 64, 2, true, true>(const layernorm2d_fwd_args& param, ck_tile::stream_config stream);
#endif
// clang-format on
......@@ -112,6 +112,7 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t,
}
}
}
#ifdef CK_TILE_LAYERNORM2D_FWD_FP32_DEFAULT
else if(t.data_type.compare("fp32") == 0)
{
if(a.N % 4 == 0)
......@@ -181,6 +182,10 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t,
}
}
}
#endif
if (r < 0)
throw std::runtime_error("Without supported instances!");
return r;
}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment