Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
DeepEP
Commits
8dcdd349
Unverified
Commit
8dcdd349
authored
Jul 02, 2025
by
fzyzcjy
Committed by
GitHub
Jul 02, 2025
Browse files
cherry pick (#251)
parent
19fc0700
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
15 additions
and
3 deletions
+15
-3
tests/test_internode.py
tests/test_internode.py
+6
-1
tests/test_intranode.py
tests/test_intranode.py
+5
-1
tests/test_low_latency.py
tests/test_low_latency.py
+4
-1
No files found.
tests/test_internode.py
View file @
8dcdd349
...
...
@@ -13,7 +13,12 @@ import test_low_latency
def
test_main
(
num_sms
:
int
,
local_rank
:
int
,
num_local_ranks
:
int
,
num_ranks
:
int
,
num_nodes
:
int
,
rank
:
int
,
buffer
:
deep_ep
.
Buffer
,
group
:
dist
.
ProcessGroup
):
# Settings
num_tokens
,
hidden
,
num_topk_groups
,
num_topk
,
num_experts
=
4096
,
7168
,
min
(
num_nodes
,
4
),
8
,
(
256
//
num_ranks
)
*
num_ranks
num_tokens
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOKENS"
,
"4096"
))
hidden
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_HIDDEN"
,
"7168"
))
num_topk_groups
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOPK_GROUPS"
,
str
(
min
(
num_nodes
,
4
))))
num_topk
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOPK"
,
"8"
))
num_experts
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_EXPERTS"
,
str
((
256
//
num_ranks
)
*
num_ranks
)))
assert
num_experts
%
num_ranks
==
0
and
num_local_ranks
==
8
if
local_rank
==
0
:
print
(
f
'[config] num_tokens=
{
num_tokens
}
, hidden=
{
hidden
}
, num_topk_groups=
{
num_topk_groups
}
, num_topk=
{
num_topk
}
'
,
flush
=
True
)
...
...
tests/test_intranode.py
View file @
8dcdd349
...
...
@@ -13,7 +13,11 @@ import test_low_latency
def
test_main
(
num_sms
:
int
,
local_rank
:
int
,
num_ranks
:
int
,
rank
:
int
,
buffer
:
deep_ep
.
Buffer
,
group
:
dist
.
ProcessGroup
):
# Settings
num_tokens
,
hidden
,
num_topk
,
num_experts
=
4096
,
7168
,
8
,
(
256
//
num_ranks
)
*
num_ranks
num_tokens
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOKENS"
,
"4096"
))
hidden
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_HIDDEN"
,
"7168"
))
num_topk
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOPK"
,
"8"
))
num_experts
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_EXPERTS"
,
str
((
256
//
num_ranks
)
*
num_ranks
)))
assert
num_experts
%
num_ranks
==
0
if
local_rank
==
0
:
print
(
f
'[config] num_tokens=
{
num_tokens
}
, hidden=
{
hidden
}
, num_topk=
{
num_topk
}
'
,
flush
=
True
)
...
...
tests/test_low_latency.py
View file @
8dcdd349
...
...
@@ -160,7 +160,10 @@ def test_main(num_tokens: int, hidden: int, num_experts: int, num_topk: int,
# noinspection PyUnboundLocalVariable
def
test_loop
(
local_rank
:
int
,
num_local_ranks
:
int
):
rank
,
num_ranks
,
group
=
init_dist
(
local_rank
,
num_local_ranks
)
num_tokens
,
hidden
,
num_topk
,
num_experts
=
128
,
7168
,
8
,
288
num_tokens
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOKENS"
,
"128"
))
hidden
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_HIDDEN"
,
"7168"
))
num_topk
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_TOPK"
,
"8"
))
num_experts
=
int
(
os
.
environ
.
get
(
"DEEPEP_TEST_NUM_EXPERTS"
,
"288"
))
num_rdma_bytes
=
deep_ep
.
Buffer
.
get_low_latency_rdma_size_hint
(
num_tokens
,
hidden
,
num_ranks
,
num_experts
)
if
local_rank
==
0
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment