Commit 5392333a authored by rocking
Browse files

Refine var name

parent 441d8973
...@@ -69,12 +69,12 @@ struct GridwiseWelfordSecondHalfLayernorm2d ...@@ -69,12 +69,12 @@ struct GridwiseWelfordSecondHalfLayernorm2d
static constexpr auto thread_buffer_desc_n = static constexpr auto thread_buffer_desc_n =
make_naive_tensor_descriptor_packed(make_tuple(Number<NThreadSliceSize>{})); make_naive_tensor_descriptor_packed(make_tuple(Number<NThreadSliceSize>{}));
using ThreadReduceSrcDesc_M_1 = decltype(thread_buffer_desc_m_1); using ThreadWelfordSrcDesc_M_1 = decltype(thread_buffer_desc_m_1);
using ThreadReduceDstDesc_M = using ThreadWelfordDstDesc_M =
decltype(make_naive_tensor_descriptor_packed(make_tuple(Number<MThreadSliceSize>{}))); decltype(make_naive_tensor_descriptor_packed(make_tuple(Number<MThreadSliceSize>{})));
using ThreadwiseWelford = using ThreadwiseWelford =
ThreadwiseWelfordMerge<ComputeDataType, ThreadReduceSrcDesc_M_1, ThreadReduceDstDesc_M>; ThreadwiseWelfordMerge<ComputeDataType, ThreadWelfordSrcDesc_M_1, ThreadWelfordDstDesc_M>;
using BlockwiseWelford = BlockwiseWelford<ComputeDataType, using BlockwiseWelford = BlockwiseWelford<ComputeDataType,
BlockSize, BlockSize,
...@@ -298,8 +298,7 @@ struct GridwiseWelfordSecondHalfLayernorm2d ...@@ -298,8 +298,7 @@ struct GridwiseWelfordSecondHalfLayernorm2d
welford_count_thread_buf(I) = 0; welford_count_thread_buf(I) = 0;
}); });
for(index_t reducedTiles = 0; reducedTiles < numMeanVarCountBlockTileIteration_N; for(index_t n = 0; n < numMeanVarCountBlockTileIteration_N; ++n)
++reducedTiles)
{ {
threadwise_mean_load_m_nblock.Run(mean_var_grid_desc_m_n, threadwise_mean_load_m_nblock.Run(mean_var_grid_desc_m_n,
welford_mean_global_val_buf, welford_mean_global_val_buf,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment