Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
fff7fbab
Unverified
Commit
fff7fbab
authored
Sep 27, 2025
by
Mick
Committed by
GitHub
Sep 26, 2025
Browse files
ci: fix rate-limit of huggingface with hf auth login (#10947)
parent
aae7ead2
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
35 additions
and
3 deletions
+35
-3
.github/workflows/pr-test.yml
.github/workflows/pr-test.yml
+26
-0
scripts/ci/ci_install_dependency.sh
scripts/ci/ci_install_dependency.sh
+6
-0
test/srt/run_suite.py
test/srt/run_suite.py
+3
-3
No files found.
.github/workflows/pr-test.yml
View file @
fff7fbab
...
@@ -103,6 +103,8 @@ jobs:
...
@@ -103,6 +103,8 @@ jobs:
needs
:
[
check-changes
,
sgl-kernel-build-wheels
]
needs
:
[
check-changes
,
sgl-kernel-build-wheels
]
if
:
needs.check-changes.outputs.sgl_kernel == 'true'
if
:
needs.check-changes.outputs.sgl_kernel == 'true'
runs-on
:
1-gpu-runner
runs-on
:
1-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
uses
:
actions/checkout@v4
-
uses
:
actions/checkout@v4
...
@@ -191,6 +193,8 @@ jobs:
...
@@ -191,6 +193,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
1-gpu-runner
runs-on
:
1-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
strategy
:
strategy
:
fail-fast
:
false
fail-fast
:
false
matrix
:
matrix
:
...
@@ -222,6 +226,8 @@ jobs:
...
@@ -222,6 +226,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
2-gpu-runner
runs-on
:
2-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
strategy
:
strategy
:
fail-fast
:
false
fail-fast
:
false
matrix
:
matrix
:
...
@@ -253,6 +259,8 @@ jobs:
...
@@ -253,6 +259,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
4-gpu-runner
runs-on
:
4-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
strategy
:
strategy
:
fail-fast
:
false
fail-fast
:
false
matrix
:
matrix
:
...
@@ -284,6 +292,8 @@ jobs:
...
@@ -284,6 +292,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
8-gpu-runner
runs-on
:
8-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
strategy
:
strategy
:
fail-fast
:
false
fail-fast
:
false
matrix
:
matrix
:
...
@@ -315,6 +325,8 @@ jobs:
...
@@ -315,6 +325,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
1-gpu-runner
runs-on
:
1-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -374,6 +386,8 @@ jobs:
...
@@ -374,6 +386,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
1-gpu-runner
runs-on
:
1-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -425,6 +439,8 @@ jobs:
...
@@ -425,6 +439,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
2-gpu-runner
runs-on
:
2-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -482,6 +498,8 @@ jobs:
...
@@ -482,6 +498,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
1-gpu-runner
runs-on
:
1-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -512,6 +530,8 @@ jobs:
...
@@ -512,6 +530,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
2-gpu-runner
runs-on
:
2-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -542,6 +562,8 @@ jobs:
...
@@ -542,6 +562,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
4-gpu-runner
runs-on
:
4-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -569,6 +591,8 @@ jobs:
...
@@ -569,6 +591,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
8-gpu-runner
runs-on
:
8-gpu-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
steps
:
steps
:
-
name
:
Checkout code
-
name
:
Checkout code
uses
:
actions/checkout@v4
uses
:
actions/checkout@v4
...
@@ -596,6 +620,8 @@ jobs:
...
@@ -596,6 +620,8 @@ jobs:
if
:
always() && !failure() && !cancelled() &&
if
:
always() && !failure() && !cancelled() &&
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
((needs.check-changes.outputs.main_package == 'true') || (needs.check-changes.outputs.sgl_kernel == 'true'))
runs-on
:
4-b200-runner
runs-on
:
4-b200-runner
env
:
HF_TOKEN
:
${{ secrets.HF_TOKEN }}
strategy
:
strategy
:
fail-fast
:
false
fail-fast
:
false
steps
:
steps
:
...
...
scripts/ci/ci_install_dependency.sh
View file @
fff7fbab
...
@@ -91,3 +91,9 @@ fi
...
@@ -91,3 +91,9 @@ fi
# Show current packages
# Show current packages
$PIP_CMD
list
$PIP_CMD
list
if
[
-n
"
${
HF_TOKEN
:-}
"
]
;
then
$PIP_CMD
install
-U
"huggingface_hub[cli]"
$PIP_INSTALL_SUFFIX
hf auth login
--token
$HF_TOKEN
fi
test/srt/run_suite.py
View file @
fff7fbab
...
@@ -35,7 +35,7 @@ suites = {
...
@@ -35,7 +35,7 @@ suites = {
# TestFile("models/test_grok_models.py", 60), # Disabled due to illegal memory access
# TestFile("models/test_grok_models.py", 60), # Disabled due to illegal memory access
TestFile
(
"models/test_qwen_models.py"
,
82
),
TestFile
(
"models/test_qwen_models.py"
,
82
),
TestFile
(
"models/test_reward_models.py"
,
132
),
TestFile
(
"models/test_reward_models.py"
,
132
),
TestFile
(
"models/test_vlm_models.py"
,
437
),
TestFile
(
"models/test_vlm_models.py"
,
741
),
TestFile
(
"models/test_transformers_models.py"
,
320
),
TestFile
(
"models/test_transformers_models.py"
,
320
),
TestFile
(
"openai_server/basic/test_protocol.py"
,
10
),
TestFile
(
"openai_server/basic/test_protocol.py"
,
10
),
TestFile
(
"openai_server/basic/test_serving_chat.py"
,
10
),
TestFile
(
"openai_server/basic/test_serving_chat.py"
,
10
),
...
@@ -93,7 +93,7 @@ suites = {
...
@@ -93,7 +93,7 @@ suites = {
TestFile
(
"test_multi_tokenizer.py"
,
230
),
TestFile
(
"test_multi_tokenizer.py"
,
230
),
TestFile
(
"test_no_chunked_prefill.py"
,
108
),
TestFile
(
"test_no_chunked_prefill.py"
,
108
),
TestFile
(
"test_no_overlap_scheduler.py"
,
234
),
TestFile
(
"test_no_overlap_scheduler.py"
,
234
),
TestFile
(
"test_original_logprobs.py"
,
200
),
TestFile
(
"test_original_logprobs.py"
,
41
),
TestFile
(
"test_penalty.py"
,
41
),
TestFile
(
"test_penalty.py"
,
41
),
TestFile
(
"test_page_size.py"
,
60
),
TestFile
(
"test_page_size.py"
,
60
),
TestFile
(
"test_priority_scheduling.py"
,
100
),
TestFile
(
"test_priority_scheduling.py"
,
100
),
...
@@ -244,7 +244,7 @@ suite_amd = {
...
@@ -244,7 +244,7 @@ suite_amd = {
TestFile
(
"test_skip_tokenizer_init.py"
,
117
),
TestFile
(
"test_skip_tokenizer_init.py"
,
117
),
TestFile
(
"test_srt_engine.py"
,
261
),
TestFile
(
"test_srt_engine.py"
,
261
),
TestFile
(
"test_srt_endpoint.py"
,
130
),
TestFile
(
"test_srt_endpoint.py"
,
130
),
TestFile
(
"test_torch_compile.py"
,
76
),
TestFile
(
"test_torch_compile.py"
,
169
),
TestFile
(
"test_torch_compile_moe.py"
,
172
),
TestFile
(
"test_torch_compile_moe.py"
,
172
),
TestFile
(
"test_torch_native_attention_backend.py"
,
123
),
TestFile
(
"test_torch_native_attention_backend.py"
,
123
),
TestFile
(
"test_triton_attention_backend.py"
,
150
),
TestFile
(
"test_triton_attention_backend.py"
,
150
),
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment