Commit c521ee62 authored by Jianfeng yan
Browse files

Fixed a segmentation fault caused by a typo when creating a_grid_desc/b_grid_desc

parent 09b9ddb3
...@@ -586,8 +586,8 @@ struct DeviceGemmXdlSplitKCShuffle ...@@ -586,8 +586,8 @@ struct DeviceGemmXdlSplitKCShuffle
const auto AKSplitted = AKPad / k_batch; const auto AKSplitted = AKPad / k_batch;
const auto BKSplitted = BKPad / k_batch; const auto BKSplitted = BKPad / k_batch;
a_grid_desc_ak0_m_ak1_ = DeviceOp::MakeAGridDescriptor_AK0_M_AK1(MRaw, AKPad, StrideA); a_grid_desc_ak0_m_ak1_ = DeviceOp::MakeAGridDescriptor_AK0_M_AK1(MRaw, AKSplitted, StrideA);
b_grid_desc_bk0_n_bk1_ = DeviceOp::MakeBGridDescriptor_BK0_N_BK1(BKPad, NRaw, StrideB); b_grid_desc_bk0_n_bk1_ = DeviceOp::MakeBGridDescriptor_BK0_N_BK1(BKSplitted, NRaw, StrideB);
c_grid_desc_m_n_ = DeviceOp::MakeCGridDescriptor_M_N(MRaw, NRaw, StrideC); c_grid_desc_m_n_ = DeviceOp::MakeCGridDescriptor_M_N(MRaw, NRaw, StrideC);
if(GridwiseGemm::CheckValidity( if(GridwiseGemm::CheckValidity(
...@@ -626,6 +626,19 @@ struct DeviceGemmXdlSplitKCShuffle ...@@ -626,6 +626,19 @@ struct DeviceGemmXdlSplitKCShuffle
block_2_ctile_map_ = MakeBlock2CTileMap(BatchCount_, c_grid_desc_m_n_, 1, 1); block_2_ctile_map_ = MakeBlock2CTileMap(BatchCount_, c_grid_desc_m_n_, 1, 1);
} }
for(int batch=0; batch<BatchCount_; ++batch)
{
printf("batch = %d, ptr_offset = [%ld, %ld, %ld]\n", batch, compute_ptr_offset_of_batch_.GetAPtrOffset(batch), compute_ptr_offset_of_batch_.GetBPtrOffset(batch), compute_ptr_offset_of_batch_.GetCPtrOffset(batch));
}
const index_t grid_size =
GridwiseGemm::CalculateGridSize(c_grid_desc_m_n_) * BatchCount_;
for (int blk=0; blk<grid_size; ++blk)
{
const auto ctile_idx = block_2_ctile_map_.CalculateBottomIndex(make_multi_index(blk));
printf("blk= %d, ctile_idx = [%d, %d]\n", blk, ctile_idx[I0], ctile_idx[I1]);
}
} }
// private: // private:
......
...@@ -45,4 +45,3 @@ add_subdirectory(grouped_gemm) ...@@ -45,4 +45,3 @@ add_subdirectory(grouped_gemm)
add_subdirectory(convnd_fwd) add_subdirectory(convnd_fwd)
add_subdirectory(reduce) add_subdirectory(reduce)
add_subdirectory(conv2d_bwd_weight) add_subdirectory(conv2d_bwd_weight)
add_subdirectory(fp16_transfer_bf16)
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment