Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
0abc7948
Unverified
Commit
0abc7948
authored
Nov 25, 2025
by
Zhengxu Chen
Committed by
GitHub
Nov 25, 2025
Browse files
[caching] Add enable_prompt_embeds and cpu_offload_gb to compile hashes. (#29435)
Signed-off-by:
zhxchen17
<
zhxchen17@fb.com
>
parent
4e57c658
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
1 addition
and
4 deletions
+1
-4
vllm/config/cache.py
vllm/config/cache.py
+1
-3
vllm/config/model.py
vllm/config/model.py
+0
-1
No files found.
vllm/config/cache.py
View file @
0abc7948
...
@@ -144,7 +144,7 @@ class CacheConfig:
...
@@ -144,7 +144,7 @@ class CacheConfig:
kv_offloading_backend
:
KVOffloadingBackend
|
None
=
None
kv_offloading_backend
:
KVOffloadingBackend
|
None
=
None
"""The backend to use for KV cache offloading. Supported backends include
"""The backend to use for KV cache offloading. Supported backends include
'native' (vLLM native CPU offloading), 'lmcache' This option must be used
'native' (vLLM native CPU offloading), 'lmcache' This option must be used
together with kv_offloading_size."""
together with kv_offloading_size."""
def
compute_hash
(
self
)
->
str
:
def
compute_hash
(
self
)
->
str
:
...
@@ -167,8 +167,6 @@ class CacheConfig:
...
@@ -167,8 +167,6 @@ class CacheConfig:
"num_gpu_blocks_override"
,
"num_gpu_blocks_override"
,
"enable_prefix_caching"
,
"enable_prefix_caching"
,
"prefix_caching_hash_algo"
,
"prefix_caching_hash_algo"
,
# `cpu_offload_gb` does not use `torch.compile` yet.
"cpu_offload_gb"
,
"cpu_kvcache_space_bytes"
,
"cpu_kvcache_space_bytes"
,
"mamba_page_size_padded"
,
"mamba_page_size_padded"
,
# Post-init/derived counters
# Post-init/derived counters
...
...
vllm/config/model.py
View file @
0abc7948
...
@@ -345,7 +345,6 @@ class ModelConfig:
...
@@ -345,7 +345,6 @@ class ModelConfig:
"logprobs_mode"
,
"logprobs_mode"
,
"disable_cascade_attn"
,
"disable_cascade_attn"
,
"skip_tokenizer_init"
,
"skip_tokenizer_init"
,
"enable_prompt_embeds"
,
"served_model_name"
,
"served_model_name"
,
"config_format"
,
"config_format"
,
"hf_token"
,
"hf_token"
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment