mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-21 15:15:45 +08:00
[Core] Drop overly aggressive whisper assertion (#25408)
Signed-off-by: Russell Bryant <rbryant@redhat.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
d96a3fc653
commit
e97cf2e32b
@@ -463,10 +463,6 @@ class Scheduler(SchedulerInterface):
 # always padded to the maximum length. If we support other
 # encoder-decoder models, this will need to be updated if we
 # want to only allocate what is needed.
-assert ("whisper"
-in self.vllm_config.model_config.model.lower()), (
-"Whisper is the only supported "
-"encoder-decoder model.")
 num_encoder_tokens =\
 self.scheduler_config.max_num_encoder_input_tokens
 else:
Loading…
x
Reference in New Issue
Block a user