Commit 9860dad8 authored by carlushuang
Browse files

Slightly improve performance by reorganizing the pipeline.

parent b504e7a7
...@@ -63,8 +63,8 @@ struct GridwiseGemmPipeline_v3 ...@@ -63,8 +63,8 @@ struct GridwiseGemmPipeline_v3
while(num_loop > 0) while(num_loop > 0)
{ {
block_sync_lds();
a_blockwise_copy.RunRead(a_grid_desc, a_grid_buf); a_blockwise_copy.RunRead(a_grid_desc, a_grid_buf);
block_sync_lds();
b_blockwise_copy.RunRead(b_grid_desc, b_grid_buf); b_blockwise_copy.RunRead(b_grid_desc, b_grid_buf);
blockwise_gemm.Run(a_block_buf, b_block_buf, c_thread_buf); blockwise_gemm.Run(a_block_buf, b_block_buf, c_thread_buf);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment