mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-08 14:08:28 +08:00
[Misc] refactor(config): clean up unused code (#6320)
This commit is contained in:
parent
c4774eb841
commit
3963a5335b
@ -138,12 +138,10 @@ class ModelConfig:
|
||||
self.quantization = quantization
|
||||
self.quantization_param_path = quantization_param_path
|
||||
self.enforce_eager = enforce_eager
|
||||
self.max_context_len_to_capture = max_context_len_to_capture
|
||||
if self.max_context_len_to_capture is not None:
|
||||
if max_context_len_to_capture is not None:
|
||||
raise ValueError("`max_context_len_to_capture` is deprecated. "
|
||||
"Use `max_seq_len_to_capture` instead.")
|
||||
self.max_seq_len_to_capture = (max_seq_len_to_capture
|
||||
or max_context_len_to_capture)
|
||||
self.max_seq_len_to_capture = max_seq_len_to_capture
|
||||
self.max_logprobs = max_logprobs
|
||||
self.disable_sliding_window = disable_sliding_window
|
||||
self.skip_tokenizer_init = skip_tokenizer_init
|
||||
|
||||
@ -109,9 +109,6 @@ class XPUModelRunner(ModelRunnerBase[ModelInputForXPU]):
|
||||
|
||||
self.kv_cache_dtype = kv_cache_dtype
|
||||
self.block_size = cache_config.block_size
|
||||
self.max_context_len_to_capture = (
|
||||
self.model_config.max_context_len_to_capture
|
||||
if self.model_config is not None else 0)
|
||||
|
||||
self.attn_backend = get_attn_backend(
|
||||
self.model_config.get_num_attention_heads(self.parallel_config),
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user