Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
DeepEP
Commits
079c5a4f
"examples/cpp-examples/CMakeLists.txt" did not exist on "3eff31f28b17914bf8fe1fe8a226d09cba60b82f"
Commit
079c5a4f
authored
Jul 14, 2025
by
Shangyan Zhou
Browse files
Fix
parent
eb155da4
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
6 additions
and
12 deletions
+6
-12
csrc/kernels/internode.cu
csrc/kernels/internode.cu
+6
-12
No files found.
csrc/kernels/internode.cu
View file @
079c5a4f
...
...
@@ -1048,23 +1048,17 @@ __global__ void cached_notify(const int rdma_clean_offset, const int rdma_num_in
// Using two SMs, which clean the RDMA/NVL buffer respectively
if
(
sm_id
==
0
)
{
// Barrier for RDMA
if
(
thread_id
==
0
)
if
(
thread_id
==
32
)
nvshmem_sync_with_same_gpu_idx
<
kLowLatencyMode
>
(
rdma_team
);
__syncthreads
();
// Barrier for NVL
barrier_block
<
NUM_MAX_NVL_PEERS
,
true
>
(
barrier_signal_ptrs
,
nvl_rank
);
// Clean RDMA buffer
auto
rdma_buffer_ptr_int
=
static_cast
<
int
*>
(
rdma_buffer_ptr
);
#pragma unroll
for
(
int
i
=
thread_id
;
i
<
rdma_num_int_clean
;
i
+=
num_threads
)
rdma_buffer_ptr_int
[
rdma_clean_offset
+
i
]
=
0
;
__syncthreads
();
// Barrier again
if
(
thread_id
==
0
)
nvshmem_sync_with_same_gpu_idx
<
kLowLatencyMode
>
(
rdma_team
);
}
else
if
(
sm_id
==
1
)
{
// Barrier for NVL
barrier_block
<
NUM_MAX_NVL_PEERS
,
true
>
(
barrier_signal_ptrs
,
nvl_rank
);
// Clean NVL buffer
auto
nvl_buffer_ptr_int
=
static_cast
<
int
*>
(
buffer_ptrs
[
nvl_rank
]);
...
...
@@ -1074,8 +1068,8 @@ __global__ void cached_notify(const int rdma_clean_offset, const int rdma_num_in
__syncthreads
();
// Barrier again
if
(
warp
_id
==
1
)
nvshmem_sync_with_same_gpu_idx
_warp
<
kLowLatencyMode
>
(
rdma_team
,
rank
,
lane_id
);
if
(
thread
_id
==
32
)
nvshmem_sync_with_same_gpu_idx
<
kLowLatencyMode
>
(
rdma_team
);
barrier_block
<
NUM_MAX_NVL_PEERS
>
(
barrier_signal_ptrs
,
nvl_rank
);
}
else
if
(
sm_id
==
1
)
{
if
(
is_cached_dispatch
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment