Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
fdc4e1e5
Unverified
Commit
fdc4e1e5
authored
Oct 03, 2025
by
fzyzcjy
Committed by
GitHub
Oct 03, 2025
Browse files
Tiny move files to utils folder (#11166)
parent
04b86b3c
Changes
66
Show whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
19 additions
and
9 deletions
+19
-9
test/srt/test_patch_torch.py
test/srt/test_patch_torch.py
+1
-1
test/srt/test_sagemaker_server.py
test/srt/test_sagemaker_server.py
+1
-1
test/srt/test_session_control.py
test/srt/test_session_control.py
+1
-1
test/srt/test_srt_engine.py
test/srt/test_srt_engine.py
+1
-1
test/srt/test_tokenizer_batch_encode.py
test/srt/test_tokenizer_batch_encode.py
+3
-1
test/srt/test_tokenizer_manager.py
test/srt/test_tokenizer_manager.py
+12
-4
No files found.
test/srt/test_patch_torch.py
View file @
fdc4e1e5
...
@@ -6,7 +6,7 @@ from typing import Dict, List
...
@@ -6,7 +6,7 @@ from typing import Dict, List
import
torch
import
torch
import
torch.multiprocessing
as
mp
import
torch.multiprocessing
as
mp
from
sglang.srt.patch_torch
import
monkey_patch_torch_reductions
from
sglang.srt.
utils.
patch_torch
import
monkey_patch_torch_reductions
class
TestReleaseMemoryOccupation
(
unittest
.
TestCase
):
class
TestReleaseMemoryOccupation
(
unittest
.
TestCase
):
...
...
test/srt/test_sagemaker_server.py
View file @
fdc4e1e5
...
@@ -7,8 +7,8 @@ import unittest
...
@@ -7,8 +7,8 @@ import unittest
import
requests
import
requests
from
sglang.srt.hf_transformers_utils
import
get_tokenizer
from
sglang.srt.utils
import
kill_process_tree
from
sglang.srt.utils
import
kill_process_tree
from
sglang.srt.utils.hf_transformers_utils
import
get_tokenizer
from
sglang.test.test_utils
import
(
from
sglang.test.test_utils
import
(
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
...
...
test/srt/test_session_control.py
View file @
fdc4e1e5
...
@@ -13,8 +13,8 @@ import unittest
...
@@ -13,8 +13,8 @@ import unittest
import
aiohttp
import
aiohttp
import
requests
import
requests
from
sglang.srt.hf_transformers_utils
import
get_tokenizer
from
sglang.srt.utils
import
kill_process_tree
from
sglang.srt.utils
import
kill_process_tree
from
sglang.srt.utils.hf_transformers_utils
import
get_tokenizer
from
sglang.test.test_utils
import
(
from
sglang.test.test_utils
import
(
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_SMALL_MODEL_NAME_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
...
...
test/srt/test_srt_engine.py
View file @
fdc4e1e5
...
@@ -12,8 +12,8 @@ import torch
...
@@ -12,8 +12,8 @@ import torch
import
sglang
as
sgl
import
sglang
as
sgl
from
sglang.bench_offline_throughput
import
BenchArgs
,
throughput_test
from
sglang.bench_offline_throughput
import
BenchArgs
,
throughput_test
from
sglang.srt.hf_transformers_utils
import
get_tokenizer
from
sglang.srt.server_args
import
ServerArgs
from
sglang.srt.server_args
import
ServerArgs
from
sglang.srt.utils.hf_transformers_utils
import
get_tokenizer
from
sglang.test.few_shot_gsm8k_engine
import
run_eval
from
sglang.test.few_shot_gsm8k_engine
import
run_eval
from
sglang.test.test_utils
import
(
from
sglang.test.test_utils
import
(
DEFAULT_SMALL_EMBEDDING_MODEL_NAME_FOR_TEST
,
DEFAULT_SMALL_EMBEDDING_MODEL_NAME_FOR_TEST
,
...
...
test/srt/test_tokenizer_batch_encode.py
View file @
fdc4e1e5
...
@@ -34,7 +34,9 @@ class TestTokenizerBatchEncode(unittest.TestCase):
...
@@ -34,7 +34,9 @@ class TestTokenizerBatchEncode(unittest.TestCase):
with
patch
(
"zmq.asyncio.Context"
),
patch
(
with
patch
(
"zmq.asyncio.Context"
),
patch
(
"sglang.srt.utils.get_zmq_socket"
"sglang.srt.utils.get_zmq_socket"
),
patch
(
"sglang.srt.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
),
patch
(
"sglang.srt.utils.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
...
...
test/srt/test_tokenizer_manager.py
View file @
fdc4e1e5
...
@@ -31,7 +31,9 @@ class TestInputFormatDetection(unittest.TestCase):
...
@@ -31,7 +31,9 @@ class TestInputFormatDetection(unittest.TestCase):
with
patch
(
"zmq.asyncio.Context"
),
patch
(
with
patch
(
"zmq.asyncio.Context"
),
patch
(
"sglang.srt.utils.get_zmq_socket"
"sglang.srt.utils.get_zmq_socket"
),
patch
(
"sglang.srt.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
),
patch
(
"sglang.srt.utils.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
...
@@ -125,7 +127,9 @@ class TestTokenizerInputPreparation(unittest.TestCase):
...
@@ -125,7 +127,9 @@ class TestTokenizerInputPreparation(unittest.TestCase):
with
patch
(
"zmq.asyncio.Context"
),
patch
(
with
patch
(
"zmq.asyncio.Context"
),
patch
(
"sglang.srt.utils.get_zmq_socket"
"sglang.srt.utils.get_zmq_socket"
),
patch
(
"sglang.srt.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
),
patch
(
"sglang.srt.utils.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
...
@@ -177,7 +181,9 @@ class TestTokenizerResultExtraction(unittest.TestCase):
...
@@ -177,7 +181,9 @@ class TestTokenizerResultExtraction(unittest.TestCase):
with
patch
(
"zmq.asyncio.Context"
),
patch
(
with
patch
(
"zmq.asyncio.Context"
),
patch
(
"sglang.srt.utils.get_zmq_socket"
"sglang.srt.utils.get_zmq_socket"
),
patch
(
"sglang.srt.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
),
patch
(
"sglang.srt.utils.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
...
@@ -279,7 +285,9 @@ class TestTokenizerManagerIntegration(unittest.TestCase):
...
@@ -279,7 +285,9 @@ class TestTokenizerManagerIntegration(unittest.TestCase):
with
patch
(
"zmq.asyncio.Context"
),
patch
(
with
patch
(
"zmq.asyncio.Context"
),
patch
(
"sglang.srt.utils.get_zmq_socket"
"sglang.srt.utils.get_zmq_socket"
),
patch
(
"sglang.srt.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
),
patch
(
"sglang.srt.utils.hf_transformers_utils.get_tokenizer"
)
as
mock_tokenizer
:
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
mock_tokenizer
.
return_value
=
Mock
(
vocab_size
=
32000
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
self
.
tokenizer_manager
=
TokenizerManager
(
self
.
server_args
,
self
.
port_args
)
...
...
Prev
1
2
3
4
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment