Commit 52c018b7 authored by mtgu0705
Browse files

fix bug, function pass.

parent 78314c0b
...@@ -365,10 +365,10 @@ struct BlockwiseGemmXdlops_pipeline_bpreshuffle_v1<BlockGemmPipelineScheduler::I ...@@ -365,10 +365,10 @@ struct BlockwiseGemmXdlops_pipeline_bpreshuffle_v1<BlockGemmPipelineScheduler::I
// B VGPR->VGPR dequant // B VGPR->VGPR dequant
b_thread_dequant_copy.Run(b_block_desc_n0_n1_k0_k1, b_thread_dequant_copy.Run(b_block_desc_n0_n1_k0_k1,
b_block_origin_idx, b_block_origin_idx,
b_thread_bufs(mfma_reg_buf), b_thread_bufs(local_read_buf),
b_thread_desc_, b_thread_desc_,
make_tuple(I0, I0, I0, I0), make_tuple(I0, I0, I0, I0),
b_thread_dequant_bufs(mfma_reg_buf)); b_thread_dequant_bufs(local_read_buf));
HotLoopScheduler(); HotLoopScheduler();
__builtin_amdgcn_sched_barrier(0); __builtin_amdgcn_sched_barrier(0);
......
...@@ -1620,7 +1620,7 @@ struct GridwiseGemm_xdl_cshuffle_v3_b_preshuffle ...@@ -1620,7 +1620,7 @@ struct GridwiseGemm_xdl_cshuffle_v3_b_preshuffle
decltype(b_block_desc_bk0_n_bk1), decltype(b_block_desc_bk0_n_bk1),
tensor_operation::element_wise::PassThrough, tensor_operation::element_wise::PassThrough,
Sequence<Number<NXdlPerWave>{}, I1, Number<KRepeat>{}, Number<BK1Value>{}>, Sequence<Number<NXdlPerWave>{}, I1, Number<KRepeat>{}, Number<BK1Value>{}>,
Sequence<0, 1, 2, 3>, Sequence<1, 2, 0, 3>,
3, 3,
BK1Number>(b_element_op); BK1Number>(b_element_op);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment