Rename PartitionedBlockwiseReduction2 to PartitionedBlockwiseReduction_V2

cee2d38e · ltqin · 7a04ca2a · cee2d38e · cee2d38e
Commit cee2d38e authored Jul 28, 2022 by ltqin
2 changed files
--- a/include/ck/tensor_operation/gpu/block/blockwise_softmax_v1.hpp
+++ b/include/ck/tensor_operation/gpu/block/blockwise_softmax_v1.hpp
@@ -62,22 +62,22 @@ struct BlockwiseSoftmax_V1
    using ThreadClusterLengths_M_K = Sequence<MPerBlock, WaveSize / MPerXDL>;
    using BlockwiseMaxReduce =
-        PartitionedBlockwiseReduction2<AccDataType,
+        PartitionedBlockwiseReduction_V2<AccDataType,
-                                       BlockSize,
+                                         BlockSize,
-                                       ThreadClusterLengths_M_K,
+                                         ThreadClusterLengths_M_K,
-                                       BlockToMKMap_M0_K_M1Adapt,
+                                         BlockToMKMap_M0_K_M1Adapt,
-                                       reduce::Max,
+                                         reduce::Max,
-                                       false, // param ignored
+                                         false, // param ignored
-                                       detail::AccumulateWithNanIgnore<reduce::Max, AccDataType>>;
+                                         detail::AccumulateWithNanIgnore<reduce::Max, AccDataType>>;
    using BlockwiseSumReduce =
-        PartitionedBlockwiseReduction2<AccDataType,
+        PartitionedBlockwiseReduction_V2<AccDataType,
-                                       BlockSize,
+                                         BlockSize,
-                                       ThreadClusterLengths_M_K,
+                                         ThreadClusterLengths_M_K,
-                                       BlockToMKMap_M0_K_M1Adapt,
+                                         BlockToMKMap_M0_K_M1Adapt,
-                                       reduce::Add,
+                                         reduce::Add,
-                                       false, // ignored
+                                         false, // ignored
-                                       detail::AccumulateWithNanIgnore<reduce::Add, AccDataType>>;
+                                         detail::AccumulateWithNanIgnore<reduce::Add, AccDataType>>;
    using ThreadwiseSumReduce =
        ThreadwiseReduction<AccDataType,

--- a/include/ck/tensor_operation/gpu/block/reduction_functions_blockwise.hpp
+++ b/include/ck/tensor_operation/gpu/block/reduction_functions_blockwise.hpp
@@ -97,7 +97,7 @@ template <typename AccDataType,
          bool PropagateNan,
          typename Accumulation =
              detail::AccumulateWithNanCheck<PropagateNan, OpReduce, AccDataType>>
-struct PartitionedBlockwiseReduction2
+struct PartitionedBlockwiseReduction_V2
 {
    static_assert(BlockSize == ThreadClusterLengths_M_K::At(0) * ThreadClusterLengths_M_K::At(1),
                  "The product of cluster lengths should be same as BlockSize!");