Commit cee2d38e authored by ltqin
Browse files

Rename PartitionedBlockwiseReduction2 to PartitionedBlockwiseReduction_V2

parent 7a04ca2a
...@@ -62,22 +62,22 @@ struct BlockwiseSoftmax_V1 ...@@ -62,22 +62,22 @@ struct BlockwiseSoftmax_V1
using ThreadClusterLengths_M_K = Sequence<MPerBlock, WaveSize / MPerXDL>; using ThreadClusterLengths_M_K = Sequence<MPerBlock, WaveSize / MPerXDL>;
using BlockwiseMaxReduce = using BlockwiseMaxReduce =
PartitionedBlockwiseReduction2<AccDataType, PartitionedBlockwiseReduction_V2<AccDataType,
BlockSize, BlockSize,
ThreadClusterLengths_M_K, ThreadClusterLengths_M_K,
BlockToMKMap_M0_K_M1Adapt, BlockToMKMap_M0_K_M1Adapt,
reduce::Max, reduce::Max,
false, // param ignored false, // param ignored
detail::AccumulateWithNanIgnore<reduce::Max, AccDataType>>; detail::AccumulateWithNanIgnore<reduce::Max, AccDataType>>;
using BlockwiseSumReduce = using BlockwiseSumReduce =
PartitionedBlockwiseReduction2<AccDataType, PartitionedBlockwiseReduction_V2<AccDataType,
BlockSize, BlockSize,
ThreadClusterLengths_M_K, ThreadClusterLengths_M_K,
BlockToMKMap_M0_K_M1Adapt, BlockToMKMap_M0_K_M1Adapt,
reduce::Add, reduce::Add,
false, // ignored false, // ignored
detail::AccumulateWithNanIgnore<reduce::Add, AccDataType>>; detail::AccumulateWithNanIgnore<reduce::Add, AccDataType>>;
using ThreadwiseSumReduce = using ThreadwiseSumReduce =
ThreadwiseReduction<AccDataType, ThreadwiseReduction<AccDataType,
......
...@@ -97,7 +97,7 @@ template <typename AccDataType, ...@@ -97,7 +97,7 @@ template <typename AccDataType,
bool PropagateNan, bool PropagateNan,
typename Accumulation = typename Accumulation =
detail::AccumulateWithNanCheck<PropagateNan, OpReduce, AccDataType>> detail::AccumulateWithNanCheck<PropagateNan, OpReduce, AccDataType>>
struct PartitionedBlockwiseReduction2 struct PartitionedBlockwiseReduction_V2
{ {
static_assert(BlockSize == ThreadClusterLengths_M_K::At(0) * ThreadClusterLengths_M_K::At(1), static_assert(BlockSize == ThreadClusterLengths_M_K::At(0) * ThreadClusterLengths_M_K::At(1),
"The product of cluster lengths should be same as BlockSize!"); "The product of cluster lengths should be same as BlockSize!");
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment