Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
7d911154
"sgl-router/git@developer.sourcefind.cn:change/sglang.git" did not exist on "9d68bdb240a5ba2713bd130f96e457f29fc7fba1"
Unverified
Commit
7d911154
authored
Oct 30, 2024
by
rocking
Committed by
GitHub
Oct 30, 2024
Browse files
clang-format (#1612)
parent
24d996aa
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
9 additions
and
9 deletions
+9
-9
include/ck_tile/ops/reduce/block/block_reduce.hpp
include/ck_tile/ops/reduce/block/block_reduce.hpp
+9
-9
No files found.
include/ck_tile/ops/reduce/block/block_reduce.hpp
View file @
7d911154
...
...
@@ -16,8 +16,8 @@ namespace ck_tile {
// synchronize reduce result (cross lane reduction and broadcast on replicated dimension)
template
<
typename
AccDistributedTensor_
,
typename
ReduceFunc
,
bool
WithBroadcast
=
true
>
CK_TILE_DEVICE
void
block_tile_reduce_sync
(
AccDistributedTensor_
&
acc_tensor
,
const
ReduceFunc
&
reduce_func
,
bool_constant
<
WithBroadcast
>
=
{})
const
ReduceFunc
&
reduce_func
,
bool_constant
<
WithBroadcast
>
=
{})
{
using
Dstr
=
typename
AccDistributedTensor_
::
StaticTileDistribution
;
using
DstrEncode
=
typename
Dstr
::
DstrEncode
;
...
...
@@ -116,7 +116,7 @@ CK_TILE_DEVICE void block_tile_reduce_sync(AccDistributedTensor_& acc_tensor,
*/
template
<
typename
AccDistributedTensor_
,
typename
ReduceFunc
>
CK_TILE_DEVICE
void
block_tile_reduce_xor_sync
(
AccDistributedTensor_
&
acc_tensor
,
const
ReduceFunc
&
reduce_func
)
const
ReduceFunc
&
reduce_func
)
{
using
Dstr
=
typename
AccDistributedTensor_
::
StaticTileDistribution
;
using
DstrEncode
=
typename
Dstr
::
DstrEncode
;
...
...
@@ -175,9 +175,9 @@ template <typename AccDistributedTensor_,
index_t
...
InReduceDims
,
typename
ReduceFunc
>
CK_TILE_DEVICE
void
block_tile_reduce
(
AccDistributedTensor_
&
acc_tensor
,
const
InDistributedTensor_
&
in_tensor
,
sequence
<
InReduceDims
...
>
,
const
ReduceFunc
&
reduce_func
)
const
InDistributedTensor_
&
in_tensor
,
sequence
<
InReduceDims
...
>
,
const
ReduceFunc
&
reduce_func
)
{
constexpr
auto
I0
=
number
<
0
>
{};
constexpr
auto
I1
=
number
<
1
>
{};
...
...
@@ -250,9 +250,9 @@ template <typename AccDataType_,
typename
ReduceFunc
,
typename
InDataType_
>
CK_TILE_DEVICE
auto
block_tile_reduce
(
const
InDistributedTensor_
&
in_tensor
,
sequence
<
InReduceDims
...
>
in_reduce_dims
,
const
ReduceFunc
&
reduce_func
,
const
InDataType_
&
reduce_init
)
sequence
<
InReduceDims
...
>
in_reduce_dims
,
const
ReduceFunc
&
reduce_func
,
const
InDataType_
&
reduce_init
)
{
using
InDataType
=
typename
InDistributedTensor_
::
DataType
;
using
AccDataType
=
remove_cvref_t
<
AccDataType_
>
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment