Commit e0cd7f90 authored by aska-0096's avatar aska-0096
Browse files

Change back to inline asm to implement the LDS sync

parent 84a1dfb0
......@@ -434,6 +434,9 @@ struct BlockwiseGemmXdlops_pipeline_v1
});
// Wait for all waves to consume this k-loop's data
// __syncthreads();
// __builtin_amdgcn_s_waitcnt(0);
// __builtin_amdgcn_s_barrier();
block_sync_lds();
a_blockwise_copy.MoveSrcSliceWindow(a_grid_desc, a_block_copy_step);
......@@ -472,6 +475,9 @@ struct BlockwiseGemmXdlops_pipeline_v1
});
});
// Wait for all waves to produce the next k-loop's data
// __syncthreads();
// __builtin_amdgcn_s_waitcnt(0);
// __builtin_amdgcn_s_barrier();
block_sync_lds();
// Here, do a one-time prefetch read (idx=0) for the next K-loop
static_for<0, MRepeat, 1>{}([&](auto m0) {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment