Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
50876abc
Unverified
Commit
50876abc
authored
Jun 13, 2025
by
Jinn
Committed by
GitHub
Jun 13, 2025
Browse files
Add test for refactored openai server (#7161)
parent
b4c41f72
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
102 additions
and
0 deletions
+102
-0
test/srt/openai/conftest.py
test/srt/openai/conftest.py
+86
-0
test/srt/openai/test_server.py
test/srt/openai/test_server.py
+16
-0
No files found.
test/srt/openai/conftest.py
0 → 100644
View file @
50876abc
# sglang/test/srt/openai/conftest.py
import
os
import
socket
import
subprocess
import
sys
import
tempfile
import
time
from
contextlib
import
closing
from
typing
import
Generator
import
pytest
import
requests
from
sglang.srt.utils
import
kill_process_tree
# reuse SGLang helper
# Module that is executed with ``python -m`` to start the server under test.
SERVER_MODULE = "sglang.srt.entrypoints.openai.api_server"

# Model path passed to the server when the caller does not supply one.
DEFAULT_MODEL = "dummy-model"

# Seconds to wait for the readiness probe; can be overridden through the
# SGLANG_OPENAI_STARTUP_TIMEOUT environment variable.
STARTUP_TIMEOUT = float(os.environ.get("SGLANG_OPENAI_STARTUP_TIMEOUT", 120))
def _pick_free_port() -> int:
    """Return a TCP port number the OS reported as free on 127.0.0.1.

    A socket is bound to port 0 so the operating system chooses the port.
    The socket is closed before returning, so nothing holds the port
    afterwards; the caller is expected to bind it promptly.
    """
    probe = socket.socket()
    try:
        probe.bind(("127.0.0.1", 0))
        _host, port = probe.getsockname()
        return port
    finally:
        probe.close()
def _wait_until_healthy(proc: subprocess.Popen, base: str, timeout: float) -> None:
    """Block until ``GET {base}/health`` answers 200 or give up.

    Args:
        proc: The server process; polled each round to detect an early exit.
        base: Base URL of the server, without a trailing ``/health``.
        timeout: Maximum number of seconds to keep probing.

    Raises:
        RuntimeError: If the process exits before becoming healthy, or if
            no 200 response is seen within ``timeout`` seconds.
    """
    health_url = f"{base}/health"
    began = time.perf_counter()
    while time.perf_counter() - began < timeout:
        if proc.poll() is not None:  # crashed
            raise RuntimeError("api_server terminated prematurely")
        try:
            response = requests.get(health_url, timeout=1)
        except requests.RequestException:
            # Server not accepting connections yet; retry after a pause.
            pass
        else:
            if response.status_code == 200:
                return
        time.sleep(0.4)
    raise RuntimeError("api_server readiness probe timed out")
def _discard_log_file(log_file) -> None:
    """Close the temporary log file and remove it from disk (best effort)."""
    log_file.close()
    try:
        os.unlink(log_file.name)
    except OSError:
        # Removal is cleanup only; never let it mask the caller's error.
        pass


def launch_openai_server(model: str = DEFAULT_MODEL, **kw):
    """Spawn the draft OpenAI-compatible server and wait until it is ready.

    Args:
        model: Value passed to the server's ``--model-path`` option.
        **kw: Optional settings. ``args`` is an iterable of extra command-line
            arguments (each converted with ``str``); ``env`` is a mapping
            merged over ``os.environ`` for the child process.

    Returns:
        A ``(proc, base, log_file)`` tuple: the ``subprocess.Popen`` handle,
        the base URL ``http://127.0.0.1:<port>``, and the open temporary file
        that receives the server's stdout and stderr. The file is created
        with ``delete=False``, so the caller owns closing and removing it.

    Raises:
        RuntimeError: If the server exits early or does not report healthy
            within ``STARTUP_TIMEOUT`` seconds. In that case the process is
            stopped, its log is printed to stderr, and the log file is
            removed before the error propagates.
    """
    port = _pick_free_port()
    cmd = [
        sys.executable,
        "-m",
        SERVER_MODULE,
        "--model-path",
        model,
        "--host",
        "127.0.0.1",
        "--port",
        str(port),
        *map(str, kw.get("args", [])),
    ]
    env = {**os.environ, **kw.get("env", {})}

    # Write logs to a temp file so the child never blocks on a full pipe.
    log_file = tempfile.NamedTemporaryFile("w+", delete=False)
    try:
        proc = subprocess.Popen(
            cmd,
            env=env,
            stdout=log_file,
            stderr=subprocess.STDOUT,
            text=True,
        )
    except Exception:
        # Nothing was started, so nobody else will ever clean this file up.
        _discard_log_file(log_file)
        raise

    base = f"http://127.0.0.1:{port}"
    try:
        _wait_until_healthy(proc, base, STARTUP_TIMEOUT)
    except Exception:
        try:
            proc.terminate()
            try:
                proc.wait(5)
            except subprocess.TimeoutExpired:
                # The child ignored the terminate request; force it down so
                # the startup error is reported instead of a wait timeout.
                proc.kill()
                proc.wait()
            log_file.seek(0)
            print("\n--- api_server log ---\n", log_file.read(), file=sys.stderr)
        finally:
            _discard_log_file(log_file)
        # Bare raise keeps the original exception and traceback intact.
        raise
    return proc, base, log_file
@pytest.fixture(scope="session")
def openai_server() -> Generator[str, None, None]:
    """PyTest fixture that provides the server's base URL and cleans up.

    The server is launched once per test session. On teardown the process
    tree is killed, and the server's temporary log file is closed and
    removed even if killing the process raises.
    """
    proc, base, log_file = launch_openai_server()
    try:
        yield base
    finally:
        try:
            kill_process_tree(proc.pid)
        finally:
            log_file.close()
            # The log file is created with delete=False, so closing it does
            # not remove it; unlink explicitly to avoid leaving temp files.
            try:
                os.unlink(log_file.name)
            except OSError:
                # Best effort: a missing or locked file must not fail teardown.
                pass
test/srt/openai/test_server.py
0 → 100644
View file @
50876abc
# sglang/test/srt/openai/test_server.py
import
pytest
import
requests
def test_health(openai_server: str):
    """The /health endpoint answers 200 with an empty body."""
    # Bound the request so a wedged server fails the test instead of
    # hanging the whole session.
    r = requests.get(f"{openai_server}/health", timeout=10)
    assert r.status_code == 200, r.text
    assert r.text == ""
@pytest.mark.xfail(reason="Endpoint skeleton not implemented yet")
def test_models_endpoint(openai_server: str):
    """The /v1/models endpoint should answer 200 once it is implemented."""
    # Bound the request so a wedged server cannot hang the session.
    r = requests.get(f"{openai_server}/v1/models", timeout=10)
    # once implemented this should be 200
    assert r.status_code == 200
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment