Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
9480ae24
Unverified
Commit
9480ae24
authored
Sep 02, 2025
by
Kyuyeun Kim
Committed by
GitHub
Sep 02, 2025
Browse files
[Bugfix] Fix packed_factor missing attribute error (#23902)
Signed-off-by: Kyuyeun Kim <kyuyeunk@google.com>
parent
f399182e
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
8 additions
and
8 deletions
+8
-8
vllm/model_executor/layers/linear.py
vllm/model_executor/layers/linear.py
+8
-8
No files found.
vllm/model_executor/layers/linear.py
View file @
9480ae24
...
...
@@ -722,8 +722,8 @@ class MergedColumnParallelLinear(ColumnParallelLinear):
# If quantized, we need to adjust the offset and size to account
# for the packing.
if
packed_dim
==
output_dim
:
shard_size
=
shard_size
//
param
.
pack_factor
shard_offset
=
shard_offset
//
param
.
pack_factor
shard_size
=
shard_size
//
param
.
packed_factor
shard_offset
=
shard_offset
//
param
.
packed_factor
# Special case for Marlin.
shard_size
,
shard_offset
=
adjust_marlin_shard
(
param
,
shard_size
,
shard_offset
)
...
...
@@ -756,8 +756,8 @@ class MergedColumnParallelLinear(ColumnParallelLinear):
# for the packing.
packed_dim
=
getattr
(
param
,
"packed_dim"
,
None
)
if
packed_dim
==
output_dim
:
shard_size
=
shard_size
//
param
.
pack_factor
shard_offset
=
shard_offset
//
param
.
pack_factor
shard_size
=
shard_size
//
param
.
packed_factor
shard_offset
=
shard_offset
//
param
.
packed_factor
# Special case for Marlin.
shard_size
,
shard_offset
=
adjust_marlin_shard
(
param
,
shard_size
,
shard_offset
)
...
...
@@ -1107,8 +1107,8 @@ class QKVParallelLinear(ColumnParallelLinear):
# If quantized, we need to adjust the offset and size to account
# for the packing.
if
packed_dim
==
output_dim
:
shard_size
=
shard_size
//
param
.
pack_factor
shard_offset
=
shard_offset
//
param
.
pack_factor
shard_size
=
shard_size
//
param
.
packed_factor
shard_offset
=
shard_offset
//
param
.
packed_factor
# Special case for Marlin.
shard_size
,
shard_offset
=
adjust_marlin_shard
(
...
...
@@ -1155,8 +1155,8 @@ class QKVParallelLinear(ColumnParallelLinear):
# for the packing.
packed_dim
=
getattr
(
param
,
"packed_dim"
,
None
)
if
packed_dim
==
output_dim
:
shard_size
=
shard_size
//
param
.
pack_factor
shard_offset
=
shard_offset
//
param
.
pack_factor
shard_size
=
shard_size
//
param
.
packed_factor
shard_offset
=
shard_offset
//
param
.
packed_factor
# Special case for Marlin.
shard_size
,
shard_offset
=
adjust_marlin_shard
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment