Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
DeepEP
Commits
ffc39ba0
"platforms/hip/tests/TestHipSort.cpp" did not exist on "644cc275ab5a549a82cce4d49680da729c2051e6"
Commit
ffc39ba0
authored
Mar 27, 2025
by
Chenggang Zhao
Browse files
Stronger acquire scope for low-latency kernels
parent
7d52ad72
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
2 deletions
+2
-2
csrc/kernels/internode_ll.cu
csrc/kernels/internode_ll.cu
+2
-2
No files found.
csrc/kernels/internode_ll.cu
View file @
ffc39ba0
...
...
@@ -260,7 +260,7 @@ dispatch(void* packed_recv_x, float* packed_recv_x_scales,
 int num_recv_tokens, recv_token_begin_idx;
 EP_STATIC_ASSERT(kNumWarpsPerGroup > 1, "Requires more than one warp per group");
 if (sub_warp_id == 1 and lane_id == 0) {
-    while ((num_recv_tokens = ld_acquire_global(rdma_recv_count + local_expert_idx * num_ranks + src_rank)) == 0);
+    while ((num_recv_tokens = ld_acquire_sys_global(rdma_recv_count + local_expert_idx * num_ranks + src_rank)) == 0);
     num_recv_tokens = -num_recv_tokens - 1;
     recv_token_begin_idx = atomicAdd(packed_recv_count + local_expert_idx, num_recv_tokens);
     shared_num_recv_tokens[warp_group_id] = num_recv_tokens;
...
...
@@ -450,7 +450,7 @@ combine(void* combined_x,
 if (responsible_expert_idx < num_experts) {
     EP_STATIC_ASSERT(kNumWarpsPerGroup > 1, "Invalid number of warps per group");
     if (sub_warp_id == 0 and lane_id == 0)
-        while (ld_acquire_global(rdma_recv_flag + responsible_expert_idx) == 0);
+        while (ld_acquire_sys_global(rdma_recv_flag + responsible_expert_idx) == 0);
 }
 cg::this_grid().sync();
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment