Commit cee2d38e authored by ltqin
Browse files

Rename PartitionedBlockwiseReduction2 to PartitionedBlockwiseReduction_V2

parent 7a04ca2a
......@@ -62,7 +62,7 @@ struct BlockwiseSoftmax_V1
using ThreadClusterLengths_M_K = Sequence<MPerBlock, WaveSize / MPerXDL>;
using BlockwiseMaxReduce =
PartitionedBlockwiseReduction2<AccDataType,
PartitionedBlockwiseReduction_V2<AccDataType,
BlockSize,
ThreadClusterLengths_M_K,
BlockToMKMap_M0_K_M1Adapt,
......@@ -71,7 +71,7 @@ struct BlockwiseSoftmax_V1
detail::AccumulateWithNanIgnore<reduce::Max, AccDataType>>;
using BlockwiseSumReduce =
PartitionedBlockwiseReduction2<AccDataType,
PartitionedBlockwiseReduction_V2<AccDataType,
BlockSize,
ThreadClusterLengths_M_K,
BlockToMKMap_M0_K_M1Adapt,
......
......@@ -97,7 +97,7 @@ template <typename AccDataType,
bool PropagateNan,
typename Accumulation =
detail::AccumulateWithNanCheck<PropagateNan, OpReduce, AccDataType>>
struct PartitionedBlockwiseReduction2
struct PartitionedBlockwiseReduction_V2
{
static_assert(BlockSize == ThreadClusterLengths_M_K::At(0) * ThreadClusterLengths_M_K::At(1),
"The product of cluster lengths should be same as BlockSize!");
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment