mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-16 15:55:55 +08:00
[caching] Add enable_prompt_embeds and cpu_offload_gb to compile hashes. (#29435)
Signed-off-by: zhxchen17 <zhxchen17@fb.com>
This commit is contained in:
parent
4e57c6587f
commit
0abc79482a
@@ -167,8 +167,6 @@ class CacheConfig:
|
||||
"num_gpu_blocks_override",
|
||||
"enable_prefix_caching",
|
||||
"prefix_caching_hash_algo",
|
||||
-# `cpu_offload_gb` does not use `torch.compile` yet.
|
||||
-"cpu_offload_gb",
|
||||
"cpu_kvcache_space_bytes",
|
||||
"mamba_page_size_padded",
|
||||
# Post-init/derived counters
|
||||
|
||||
@@ -345,7 +345,6 @@ class ModelConfig:
|
||||
"logprobs_mode",
|
||||
"disable_cascade_attn",
|
||||
"skip_tokenizer_init",
|
||||
-"enable_prompt_embeds",
|
||||
"served_model_name",
|
||||
"config_format",
|
||||
"hf_token",
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user