Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
66b809cc
Commit
66b809cc
authored
Feb 08, 2025
by
zhuwenwen
Browse files
Merge tag 'v0.7.2' into v0.7.2-dev
parents
37b63c24
0408efc6
Changes
1000
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
40 additions
and
0 deletions
+40
-0
vllm/spec_decode/medusa_worker.py
vllm/spec_decode/medusa_worker.py
+2
-0
vllm/spec_decode/metrics.py
vllm/spec_decode/metrics.py
+2
-0
vllm/spec_decode/mlp_speculator_worker.py
vllm/spec_decode/mlp_speculator_worker.py
+2
-0
vllm/spec_decode/mqa_scorer.py
vllm/spec_decode/mqa_scorer.py
+2
-0
vllm/spec_decode/multi_step_worker.py
vllm/spec_decode/multi_step_worker.py
+2
-0
vllm/spec_decode/ngram_worker.py
vllm/spec_decode/ngram_worker.py
+2
-0
vllm/spec_decode/proposer_worker_base.py
vllm/spec_decode/proposer_worker_base.py
+2
-0
vllm/spec_decode/smaller_tp_proposer_worker.py
vllm/spec_decode/smaller_tp_proposer_worker.py
+2
-0
vllm/spec_decode/spec_decode_worker.py
vllm/spec_decode/spec_decode_worker.py
+2
-0
vllm/spec_decode/target_model_runner.py
vllm/spec_decode/target_model_runner.py
+2
-0
vllm/spec_decode/top1_proposer.py
vllm/spec_decode/top1_proposer.py
+2
-0
vllm/spec_decode/util.py
vllm/spec_decode/util.py
+2
-0
vllm/tracing.py
vllm/tracing.py
+2
-0
vllm/transformers_utils/__init__.py
vllm/transformers_utils/__init__.py
+2
-0
vllm/transformers_utils/config.py
vllm/transformers_utils/config.py
+2
-0
vllm/transformers_utils/configs/__init__.py
vllm/transformers_utils/configs/__init__.py
+2
-0
vllm/transformers_utils/configs/arctic.py
vllm/transformers_utils/configs/arctic.py
+2
-0
vllm/transformers_utils/configs/chatglm.py
vllm/transformers_utils/configs/chatglm.py
+2
-0
vllm/transformers_utils/configs/cohere2.py
vllm/transformers_utils/configs/cohere2.py
+2
-0
vllm/transformers_utils/configs/dbrx.py
vllm/transformers_utils/configs/dbrx.py
+2
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
vllm/spec_decode/medusa_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
os
import
weakref
from
typing
import
List
,
Optional
,
Set
,
Tuple
,
Dict
...
...
vllm/spec_decode/metrics.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
time
from
typing
import
Callable
,
Optional
,
Union
...
...
vllm/spec_decode/mlp_speculator_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
List
,
Optional
,
Set
,
Tuple
,
Dict
import
torch
...
...
vllm/spec_decode/mqa_scorer.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
vllm.sequence
import
(
ExecuteModelRequest
,
SequenceData
,
SequenceGroupMetadata
,
get_all_seq_ids
)
from
vllm.spec_decode.interfaces
import
(
SpeculativeProposals
,
...
...
vllm/spec_decode/multi_step_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
copy
import
weakref
from
typing
import
Dict
,
List
,
Set
,
Tuple
...
...
vllm/spec_decode/ngram_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
weakref
from
typing
import
List
,
Optional
,
Set
,
Tuple
...
...
vllm/spec_decode/proposer_worker_base.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
abc
import
ABC
,
abstractmethod
from
typing
import
List
,
Optional
,
Set
,
Tuple
...
...
vllm/spec_decode/smaller_tp_proposer_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
List
,
Optional
,
Set
,
Tuple
import
torch
...
...
vllm/spec_decode/spec_decode_worker.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
os
import
copy
from
collections
import
defaultdict
...
...
vllm/spec_decode/target_model_runner.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
List
,
Optional
from
vllm.sequence
import
SequenceGroupMetadata
...
...
vllm/spec_decode/top1_proposer.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
typing
import
List
,
Optional
,
Set
,
Tuple
import
torch
...
...
vllm/spec_decode/util.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
time
from
contextlib
import
contextmanager
from
typing
import
Dict
,
List
,
Optional
,
Sequence
,
Tuple
...
...
vllm/tracing.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
os
from
typing
import
Mapping
,
Optional
...
...
vllm/transformers_utils/__init__.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
vllm.envs
import
VLLM_USE_MODELSCOPE
if
VLLM_USE_MODELSCOPE
:
...
...
vllm/transformers_utils/config.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
import
enum
import
json
import
os
...
...
vllm/transformers_utils/configs/__init__.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
from
vllm.transformers_utils.configs.chatglm
import
ChatGLMConfig
from
vllm.transformers_utils.configs.cohere2
import
Cohere2Config
from
vllm.transformers_utils.configs.dbrx
import
DbrxConfig
...
...
vllm/transformers_utils/configs/arctic.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
# yapf: disable
# ruff: noqa: E501
# coding=utf-8
...
...
vllm/transformers_utils/configs/chatglm.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
# Adapted from
# https://github.com/THUDM/ChatGLM2-6B
from
transformers
import
PretrainedConfig
...
...
vllm/transformers_utils/configs/cohere2.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
# ruff: noqa
# Adapted from
...
...
vllm/transformers_utils/configs/dbrx.py
View file @
66b809cc
# SPDX-License-Identifier: Apache-2.0
# yapf: disable
# ruff: noqa: E501
# coding=utf-8
...
...
Prev
1
…
46
47
48
49
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment