Commit 6cc03335 authored by Harisankar Sadasivan
Browse files

Added Stream-K policies for 3-tile and 4-tile (streamk_sel = 3 and 4)

parent 03c25255
...@@ -1471,6 +1471,16 @@ struct BlockToCTileMap_GemmStreamK_v2 ...@@ -1471,6 +1471,16 @@ struct BlockToCTileMap_GemmStreamK_v2
{ {
sk_tiles = bigEnough ? (grid_size + num_tiles % grid_size) : num_tiles; sk_tiles = bigEnough ? (grid_size + num_tiles % grid_size) : num_tiles;
} }
else if(streamk_sel == 3)
{
sk_tiles = (num_tiles > (2 * grid_size)) ? (2 * grid_size + num_tiles % grid_size)
: num_tiles;
}
else if(streamk_sel == 4)
{
sk_tiles = (num_tiles > (3 * grid_size)) ? (3 * grid_size + num_tiles % grid_size)
: num_tiles;
}
sk_num_blocks = sk_tiles; sk_num_blocks = sk_tiles;
// if(sk_tiles < sk_num_blocks) // if(sk_tiles < sk_num_blocks)
// { // {
......
...@@ -153,7 +153,7 @@ bool profile_gemm_universal_streamk_impl(int do_verification, ...@@ -153,7 +153,7 @@ bool profile_gemm_universal_streamk_impl(int do_verification,
for(auto& op_ptr : op_ptrs) for(auto& op_ptr : op_ptrs)
{ {
std::vector<int> grid_size_list = {38, 76, 114, 152, 190, 228, 266, 304, 342, 380}; std::vector<int> grid_size_list = {38, 76, 114, 152, 190, 228, 266, 304, 342, 380};
std::vector<int> streamk_sel_list = {0, 1, 2}; std::vector<int> streamk_sel_list = {0, 1, 2, 3, 4};
if(Grid_size == -1) if(Grid_size == -1)
{ {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment