Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
66b809cc
Commit
66b809cc
authored
Feb 08, 2025
by
zhuwenwen
Browse files
Merge tag 'v0.7.2' into v0.7.2-dev
parents
37b63c24
0408efc6
Changes
1000
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
63 additions
and
0 deletions
+63
-0
tests/kernels/test_moe.py
tests/kernels/test_moe.py
+1
-0
tests/kernels/test_pos_encoding.py
tests/kernels/test_pos_encoding.py
+2
-0
tests/kernels/test_prefix_prefill.py
tests/kernels/test_prefix_prefill.py
+2
-0
tests/kernels/test_rocm_attention_selector.py
tests/kernels/test_rocm_attention_selector.py
+31
-0
tests/kernels/test_rotary_embedding.py
tests/kernels/test_rotary_embedding.py
+1
-0
tests/kernels/test_triton_decode_attention.py
tests/kernels/test_triton_decode_attention.py
+2
-0
tests/kernels/test_triton_scaled_mm.py
tests/kernels/test_triton_scaled_mm.py
+1
-0
tests/kernels/test_utils.py
tests/kernels/test_utils.py
+1
-0
tests/kernels/untest_aqlm.py
tests/kernels/untest_aqlm.py
+2
-0
tests/kernels/untest_awq.py
tests/kernels/untest_awq.py
+2
-0
tests/kernels/untest_causal_conv1d.py
tests/kernels/untest_causal_conv1d.py
+2
-0
tests/kernels/untest_flashinfer.py
tests/kernels/untest_flashinfer.py
+2
-0
tests/kernels/untest_fp8_quant.py
tests/kernels/untest_fp8_quant.py
+2
-0
tests/kernels/untest_ggml.py
tests/kernels/untest_ggml.py
+2
-0
tests/kernels/untest_gptq.py
tests/kernels/untest_gptq.py
+2
-0
tests/kernels/untest_mamba_ssm.py
tests/kernels/untest_mamba_ssm.py
+2
-0
tests/kernels/untest_marlin_gemm.py
tests/kernels/untest_marlin_gemm.py
+1
-0
tests/kernels/untest_permute_cols.py
tests/kernels/untest_permute_cols.py
+2
-0
tests/kernels/utils.py
tests/kernels/utils.py
+1
-0
tests/kv_transfer/disagg_test.py
tests/kv_transfer/disagg_test.py
+2
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
tests/kernels/test_moe.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""Tests for the MOE layers.
Run `pytest tests/kernels/test_moe.py`.
...
...
tests/kernels/test_pos_encoding.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
itertools
import
accumulate
,
product
from
typing
import
Dict
,
List
,
Optional
...
...
tests/kernels/test_prefix_prefill.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
math
import
random
import
time
...
...
tests/kernels/test_rocm_attention_selector.py
0 → 100644
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
unittest.mock
import
patch
import
pytest
import
torch
from
tests.kernels.utils
import
override_backend_env_variable
from
vllm.attention.selector
import
_cached_get_attn_backend
,
get_attn_backend
from
vllm.platforms.rocm
import
RocmPlatform
@pytest.fixture(autouse=True)
def clear_cache():
    """Empty the cached attention-backend lookup before each test.

    Declared with ``autouse=True`` so it applies to every test in this module
    without being requested explicitly; this keeps one test's cached backend
    choice from being returned to the next.
    """
    _cached_get_attn_backend.cache_clear()
def test_selector(monkeypatch):
    """Check which attention backend the selector reports on ROCm.

    The backend override is set to "ROCM_FLASH" through
    ``override_backend_env_variable`` and ``current_platform`` inside
    ``vllm.attention.selector`` is patched with a ``RocmPlatform`` instance.
    Each selection below is then verified by the name of the returned backend.
    """
    override_backend_env_variable(monkeypatch, "ROCM_FLASH")

    # (positional arguments for get_attn_backend, expected backend name)
    # NOTE(review): the third argument is torch.float16 in the first case but
    # the string "auto" in the second -- confirm both forms are intended.
    selection_cases = (
        ((16, torch.float16, torch.float16, 16, False), "ROCM_FLASH"),
        # mla test for deepseek related
        ((576, torch.bfloat16, "auto", 16, False, False, True), "TRITON_MLA"),
    )

    rocm_platform = RocmPlatform()
    with patch("vllm.attention.selector.current_platform", rocm_platform):
        for selector_args, expected_name in selection_cases:
            backend = get_attn_backend(*selector_args)
            assert backend.get_name() == expected_name
tests/kernels/test_rotary_embedding.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""
Tests for miscellaneous utilities
"""
...
...
tests/kernels/test_triton_decode_attention.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
pytest
import
torch
...
...
tests/kernels/test_triton_scaled_mm.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""Tests for the triton_scaled_mm kernel
Run `pytest tests/kernels/test_triton_scaled_mm.py`.
...
...
tests/kernels/test_utils.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""
Tests for miscellaneous utilities
"""
...
...
tests/kernels/untest_aqlm.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
torch
from
tests.kernels.utils
import
opcheck
...
...
tests/kernels/untest_awq.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
os
import
pytest
...
...
tests/kernels/untest_causal_conv1d.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
Optional
import
pytest
...
...
tests/kernels/untest_flashinfer.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
List
,
Optional
,
Tuple
import
flashinfer
...
...
tests/kernels/untest_fp8_quant.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
pytest
import
torch
...
...
tests/kernels/untest_ggml.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
gguf
import
pytest
import
torch
...
...
tests/kernels/untest_gptq.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
torch
from
tests.kernels.utils
import
opcheck
...
...
tests/kernels/untest_mamba_ssm.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
pytest
import
torch
import
torch.nn.functional
as
F
...
...
tests/kernels/untest_marlin_gemm.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""Tests for the marlin kernel.
Run `pytest tests/kernels/marlin/test_marlin_gemm.py`.
...
...
tests/kernels/untest_permute_cols.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
pytest
import
torch
...
...
tests/kernels/utils.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
"""Kernel test utils"""
import
itertools
...
...
tests/kv_transfer/disagg_test.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
os
import
subprocess
import
sys
...
...
Prev
1
…
10
11
12
13
14
15
16
17
18
…
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment