Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
2c4f5cca
"tests/git@developer.sourcefind.cn:OpenDAS/deepspeed.git" did not exist on "871f3048ad0d05e79f8835849b7a00656a14b3f4"
Unverified
Commit
2c4f5cca
authored
Mar 15, 2025
by
Lianmin Zheng
Committed by
GitHub
Mar 15, 2025
Browse files
Fix minor style (#4460)
parent
15843047
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
7 additions
and
4 deletions
+7
-4
python/sglang/srt/mem_cache/memory_pool.py
python/sglang/srt/mem_cache/memory_pool.py
+1
-0
python/sglang/srt/utils.py
python/sglang/srt/utils.py
+5
-3
test/srt/test_eval_fp8_accuracy.py
test/srt/test_eval_fp8_accuracy.py
+1
-1
No files found.
python/sglang/srt/mem_cache/memory_pool.py
View file @
2c4f5cca
...
@@ -340,6 +340,7 @@ class MHATokenToKVPool(KVCache):
...
@@ -340,6 +340,7 @@ class MHATokenToKVPool(KVCache):
cache_v
=
cache_v
.
view
(
self
.
store_dtype
)
cache_v
=
cache_v
.
view
(
self
.
store_dtype
)
if
self
.
capture_mode
and
cache_k
.
shape
[
0
]
<
4
:
if
self
.
capture_mode
and
cache_k
.
shape
[
0
]
<
4
:
# Overlap the copy of K and V cache for small batch size
current_stream
=
self
.
device_module
.
current_stream
()
current_stream
=
self
.
device_module
.
current_stream
()
self
.
alt_stream
.
wait_stream
(
current_stream
)
self
.
alt_stream
.
wait_stream
(
current_stream
)
with
self
.
device_module
.
stream
(
self
.
alt_stream
):
with
self
.
device_module
.
stream
(
self
.
alt_stream
):
...
...
python/sglang/srt/utils.py
View file @
2c4f5cca
...
@@ -481,6 +481,7 @@ def suppress_other_loggers():
...
@@ -481,6 +481,7 @@ def suppress_other_loggers():
logging
.
getLogger
(
"vllm.distributed.device_communicators.shm_broadcast"
).
setLevel
(
logging
.
getLogger
(
"vllm.distributed.device_communicators.shm_broadcast"
).
setLevel
(
logging
.
WARN
logging
.
WARN
)
)
logging
.
getLogger
(
"vllm.config"
).
setLevel
(
logging
.
ERROR
)
warnings
.
filterwarnings
(
warnings
.
filterwarnings
(
"ignore"
,
category
=
UserWarning
,
message
=
"The given NumPy array is not writable"
"ignore"
,
category
=
UserWarning
,
message
=
"The given NumPy array is not writable"
...
@@ -527,10 +528,11 @@ def kill_process_tree(parent_pid, include_parent: bool = True, skip_pid: int = N
...
@@ -527,10 +528,11 @@ def kill_process_tree(parent_pid, include_parent: bool = True, skip_pid: int = N
pass
pass
if
include_parent
:
if
include_parent
:
if
parent_pid
==
os
.
getpid
():
sys
.
exit
(
0
)
try
:
try
:
if
parent_pid
==
os
.
getpid
():
itself
.
kill
()
sys
.
exit
(
0
)
itself
.
kill
()
itself
.
kill
()
# Sometime processes cannot be killed with SIGKILL (e.g, PID=1 launched by kubernetes),
# Sometime processes cannot be killed with SIGKILL (e.g, PID=1 launched by kubernetes),
...
...
test/srt/test_eval_fp8_accuracy.py
View file @
2c4f5cca
...
@@ -36,7 +36,7 @@ class TestEvalFP8Accuracy(unittest.TestCase):
...
@@ -36,7 +36,7 @@ class TestEvalFP8Accuracy(unittest.TestCase):
)
)
metrics
=
run_eval
(
args
)
metrics
=
run_eval
(
args
)
self
.
assertGreaterEqual
(
metrics
[
"score"
],
0.6
2
)
self
.
assertGreaterEqual
(
metrics
[
"score"
],
0.6
1
)
class
TestEvalFP8DynamicQuantAccuracy
(
unittest
.
TestCase
):
class
TestEvalFP8DynamicQuantAccuracy
(
unittest
.
TestCase
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment