Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
2d8b3257
Commit
2d8b3257
authored
Jan 28, 2026
by
zhuwenwen
Browse files
修复了awq的shape的bug,以及兼容了lmslim注册导入的情况
parent
d76fc11e
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
6 additions
and
2 deletions
+6
-2
vllm/model_executor/layers/quantization/awq.py
vllm/model_executor/layers/quantization/awq.py
+4
-1
vllm/platforms/rocm.py
vllm/platforms/rocm.py
+1
-1
vllm/utils/__init__.py
vllm/utils/__init__.py
+1
-0
No files found.
vllm/model_executor/layers/quantization/awq.py
View file @
2d8b3257
...
...
@@ -34,6 +34,9 @@ if TYPE_CHECKING:
from
vllm.model_executor.layers.quantization.awq_triton
import
awq_gemm_triton
triton_configs_dict
=
{}
def is_layer_skipped_awq(prefix: str, modules_to_not_convert: list[str]) -> bool:
    """Return whether the layer named by *prefix* is excluded from AWQ.

    A layer is skipped when any entry of *modules_to_not_convert* occurs
    as a substring of *prefix*.

    Args:
        prefix: Name/prefix string of the layer being checked.
        modules_to_not_convert: Module-name fragments to match against
            *prefix*. An empty list or ``None`` means nothing is skipped.

    Returns:
        ``True`` if at least one entry is contained in *prefix*, else
        ``False``.
    """
    # Guard against a missing skip list so that callers passing ``None``
    # get "not skipped" instead of a TypeError from iterating ``None``.
    if not modules_to_not_convert:
        return False
    return any(module_name in prefix for module_name in modules_to_not_convert)
def
get_triton_cache
(
file_path
):
# Returns the contents of the given JSON file as a dictionary.
...
...
@@ -377,7 +380,7 @@ class AWQLinearMethod(LinearMethodBase):
qzeros
=
layer
.
qzeros
scales
=
layer
.
scales
pack_factor
=
self
.
quant_config
.
pack_factor
out_shape
=
x
.
shape
[:
-
1
]
+
(
qweight
.
shape
[
-
1
]
*
pack_factor
,
)
out_shape
=
(
x
.
shape
[:
-
1
]
+
(
qweight
.
shape
[
0
]
*
1
,
)
)
reshaped_x
=
x
.
reshape
(
-
1
,
x
.
shape
[
-
1
])
m
=
reshaped_x
.
shape
[
0
]
...
...
vllm/platforms/rocm.py
View file @
2d8b3257
...
...
@@ -588,7 +588,7 @@ class RocmPlatform(Platform):
" is not set, enabling VLLM_USE_TRITON_AWQ."
)
envs
.
VLLM_USE_TRITON_AWQ
=
False
os
.
environ
[
"VLLM_USE_TRITON_AWQ"
]
=
"1"
#
os.environ["VLLM_USE_TRITON_AWQ"] = "1"
@
classmethod
def
get_punica_wrapper
(
cls
)
->
str
:
...
...
vllm/utils/__init__.py
View file @
2d8b3257
...
...
@@ -7,6 +7,7 @@ import uuid
import
torch
from
vllm.utils.torch_utils
import
direct_register_custom_op
MASK_64_BITS
=
(
1
<<
64
)
-
1
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment