"...composable_kernel.git" did not exist on "d18428901eefc3908696397b62505180a7c50359"
Commit e0cd7f90 authored by aska-0096's avatar aska-0096
Browse files

change back to inline asm to realize lds sync

parent 84a1dfb0
...@@ -434,6 +434,9 @@ struct BlockwiseGemmXdlops_pipeline_v1 ...@@ -434,6 +434,9 @@ struct BlockwiseGemmXdlops_pipeline_v1
}); });
// Wait all wave consume this k-loop data // Wait all wave consume this k-loop data
// __syncthreads();
// __builtin_amdgcn_s_waitcnt(0);
// __builtin_amdgcn_s_barrier();
block_sync_lds(); block_sync_lds();
a_blockwise_copy.MoveSrcSliceWindow(a_grid_desc, a_block_copy_step); a_blockwise_copy.MoveSrcSliceWindow(a_grid_desc, a_block_copy_step);
...@@ -472,6 +475,9 @@ struct BlockwiseGemmXdlops_pipeline_v1 ...@@ -472,6 +475,9 @@ struct BlockwiseGemmXdlops_pipeline_v1
}); });
}); });
// Wait all wave produce next k-loop data // Wait all wave produce next k-loop data
// __syncthreads();
// __builtin_amdgcn_s_waitcnt(0);
// __builtin_amdgcn_s_barrier();
block_sync_lds(); block_sync_lds();
// Here 1 time prefetch read(idx=0) of next K-loop // Here 1 time prefetch read(idx=0) of next K-loop
static_for<0, MRepeat, 1>{}([&](auto m0) { static_for<0, MRepeat, 1>{}([&](auto m0) {
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment