Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
184b50f7
Commit
184b50f7
authored
Jan 03, 2025
by
zhuwenwen
Browse files
fix run error
parent
28a8a733
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
12 additions
and
3 deletions
+12
-3
vllm/model_executor/layers/sampler.py
vllm/model_executor/layers/sampler.py
+10
-0
vllm/model_executor/models/chatglm.py
vllm/model_executor/models/chatglm.py
+0
-2
vllm/platforms/__init__.py
vllm/platforms/__init__.py
+1
-0
vllm/worker/model_runner.py
vllm/worker/model_runner.py
+1
-1
No files found.
vllm/model_executor/layers/sampler.py
View file @
184b50f7
...
...
@@ -125,6 +125,16 @@ class SamplerOutput(
# Time taken in the model execute function. This will include model forward,
# block/sync across workers, cpu-gpu sync time and sampling time.
model_execute_time
:
Optional
[
float
]
=
None
# Optional lm_head logits from the model.
logits
:
Optional
[
torch
.
Tensor
]
=
None
# tree-style cartesian candidates
cart_candidates
:
Optional
[
torch
.
Tensor
]
=
None
# tree-style attention masks
tree_attn_masks
:
Optional
[
torch
.
Tensor
]
=
None
def __getitem__(self, idx: int) -> CompletionSequenceGroupOutput:
    """Return the element of ``self.outputs`` stored at position ``idx``."""
    entries = self.outputs
    return entries[idx]
...
...
vllm/model_executor/models/chatglm.py
View file @
184b50f7
...
...
@@ -511,8 +511,6 @@ class ChatGLMModel(nn.Module):
def
__init__
(
self
,
*
,
vllm_config
:
VllmConfig
,
prefix
:
str
=
""
):
super
().
__init__
()
self
.
config
=
config
config
=
vllm_config
.
model_config
.
hf_config
cache_config
=
vllm_config
.
cache_config
...
...
vllm/platforms/__init__.py
View file @
184b50f7
from
.interface
import
_Backend
# noqa: F401
from
.interface
import
CpuArchEnum
,
Platform
,
PlatformEnum
,
UnspecifiedPlatform
import
torch
current_platform
:
Platform
...
...
vllm/worker/model_runner.py
View file @
184b50f7
...
...
@@ -476,7 +476,7 @@ class ModelInputForGPUBuilder(ModelRunnerInputBuilderBase[ModelInputForGPU]):
self
.
block_aligned_sliding_window
=
\
self
.
sliding_window_blocks
*
self
.
block_size
self
.
is_encoder_decoder_model
=
self
.
runner
.
model_config
.
is_encoder_decoder
_model
self
.
is_encoder_decoder_model
=
self
.
runner
.
model_config
.
is_encoder_decoder
def
_compute_lens
(
self
,
inter_data
:
InterDataForSeqGroup
,
seq_idx
:
int
,
seq_group_metadata
:
SequenceGroupMetadata
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment