Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
DeepEP
Commits
1d3963d2
Commit
1d3963d2
authored
Sep 11, 2025
by
Shangyan Zhou
Browse files
Fix bar.sync
parent
ef70b83e
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
4 deletions
+4
-4
csrc/kernels/internode.cu
csrc/kernels/internode.cu
+4
-4
No files found.
csrc/kernels/internode.cu
View file @
1d3963d2
...
...
@@ -439,7 +439,7 @@ dispatch(int4* recv_x, float* recv_x_scales, int64_t* recv_topk_idx, float* recv
// Per-block shared-memory arrays for the RDMA send channels; each array has
// kNumRDMARanks entries.
// NOTE(review): presumably one lock / tail / window slot per RDMA rank - confirm against the users of these arrays.
__shared__ int rdma_send_channel_lock[kNumRDMARanks];
__shared__ int rdma_send_channel_tail[kNumRDMARanks];
__shared__ uint32_t rdma_send_channel_window[kNumRDMARanks];
// Barrier helper built on PTX `bar.sync`: waits on named barrier 0 with a
// participating-thread count of (kNumDispatchRDMASenderWarps + 1) * 32.
// NOTE(review): 32 is presumably the warp size, i.e. the sender warps plus one extra warp - confirm.
auto sync_rdma_sender_smem = []() {
    const auto num_barrier_threads = (kNumDispatchRDMASenderWarps + 1) * 32;
    asm volatile("bar.sync 0, %0;" :: "r"(num_barrier_threads));
};
auto
sync_rdma_sender_smem
=
[]()
{
asm
volatile
(
"bar
rier
.sync 0, %0;"
::
"r"
((
kNumDispatchRDMASenderWarps
+
1
)
*
32
));
};
// TMA staging area: unsized `extern __shared__` byte array (its size is not
// fixed at this declaration), aligned to 1024 bytes.
extern __shared__ __align__(1024) uint8_t smem_tma_buffer[];
...
...
@@ -457,7 +457,7 @@ dispatch(int4* recv_x, float* recv_x_scales, int64_t* recv_topk_idx, float* recv
// Shared-memory state used to synchronize the forwarder warps.
// `forward_channel_head` is indexed [NUM_MAX_NVL_PEERS][kNumRDMARanks];
// `forward_channel_retired` holds one flag per NUM_MAX_NVL_PEERS entry.
__shared__ volatile int forward_channel_head[NUM_MAX_NVL_PEERS][kNumRDMARanks];
__shared__ volatile bool forward_channel_retired[NUM_MAX_NVL_PEERS];
// Barrier helper built on PTX `bar.sync`: waits on named barrier 1 with a
// participating-thread count of (NUM_MAX_NVL_PEERS + 1) * 32.
// NOTE(review): 32 is presumably the warp size, i.e. NUM_MAX_NVL_PEERS warps plus one extra warp - confirm.
auto sync_forwarder_smem = []() {
    const auto num_barrier_threads = (NUM_MAX_NVL_PEERS + 1) * 32;
    asm volatile("bar.sync 1, %0;" :: "r"(num_barrier_threads));
};
auto
sync_forwarder_smem
=
[]()
{
asm
volatile
(
"bar
rier
.sync 1, %0;"
::
"r"
((
NUM_MAX_NVL_PEERS
+
1
)
*
32
));
};
if
(
warp_role
==
WarpRole
::
kRDMASender
)
{
// Get tasks
...
...
@@ -1567,8 +1567,8 @@ combine(int4* combined_x, float* combined_topk_weights,
// Shared-memory bookkeeping for the forwarder and RDMA-receiver warps.
// `forwarder_retired` has kNumForwarders flags, `rdma_receiver_rdma_head` is
// indexed [kNumRDMAReceivers][kNumRDMARanks], and `rdma_receiver_retired` has
// kNumRDMAReceivers flags.
__shared__ volatile bool forwarder_retired[kNumForwarders];
__shared__ volatile int rdma_receiver_rdma_head[kNumRDMAReceivers][kNumRDMARanks];
__shared__ volatile bool rdma_receiver_retired[kNumRDMAReceivers];
// Barrier helper built on PTX `bar.sync`: waits on named barrier 0 with a
// participating-thread count of (kNumForwarders + 1) * 32.
// NOTE(review): 32 is presumably the warp size, i.e. the forwarder warps plus one extra warp - confirm.
auto sync_forwarder_smem = [=]() {
    const auto num_barrier_threads = (kNumForwarders + 1) * 32;
    asm volatile("bar.sync 0, %0;" :: "r"(num_barrier_threads));
};
// Barrier helper built on PTX `bar.sync`: waits on named barrier 1 with a
// participating-thread count of (kNumRDMAReceivers + 1) * 32.
// NOTE(review): 32 is presumably the warp size, i.e. the receiver warps plus one extra warp - confirm.
auto sync_rdma_receiver_smem = [=]() {
    const auto num_barrier_threads = (kNumRDMAReceivers + 1) * 32;
    asm volatile("bar.sync 1, %0;" :: "r"(num_barrier_threads));
};
auto
sync_forwarder_smem
=
[
=
]()
{
asm
volatile
(
"bar
rier
.sync 0, %0;"
::
"r"
((
kNumForwarders
+
1
)
*
32
));
};
auto
sync_rdma_receiver_smem
=
[
=
]()
{
asm
volatile
(
"bar
rier
.sync 1, %0;"
::
"r"
((
kNumRDMAReceivers
+
1
)
*
32
));
};
if
(
warp_role
==
WarpRole
::
kNVLAndRDMAForwarder
)
{
// Receive from NVL ranks and forward to RDMA ranks
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment