mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-17 07:05:01 +08:00
[caching] Add enable_prompt_embeds and cpu_offload_gb to compile hashes. (#29435)
Signed-off-by: zhxchen17 <zhxchen17@fb.com>
This commit is contained in:
parent
4e57c6587f
commit
0abc79482a
@@ -167,8 +167,6 @@ class CacheConfig:
 "num_gpu_blocks_override",
 "enable_prefix_caching",
 "prefix_caching_hash_algo",
-# `cpu_offload_gb` does not use `torch.compile` yet.
-"cpu_offload_gb",
 "cpu_kvcache_space_bytes",
 "mamba_page_size_padded",
 # Post-init/derived counters
@@ -345,7 +345,6 @@ class ModelConfig:
 "logprobs_mode",
 "disable_cascade_attn",
 "skip_tokenizer_init",
-"enable_prompt_embeds",
 "served_model_name",
 "config_format",
 "hf_token",
Loading…
x
Reference in New Issue
Block a user