mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 23:03:52 +08:00
[Core] Drop overly aggressive whisper assertion (#25408)
Signed-off-by: Russell Bryant <rbryant@redhat.com>
This commit is contained in:
@@ -463,10 +463,6 @@ class Scheduler(SchedulerInterface):
     # always padded to the maximum length. If we support other
     # encoder-decoder models, this will need to be updated if we
     # want to only allocate what is needed.
-    assert ("whisper"
-            in self.vllm_config.model_config.model.lower()), (
-                "Whisper is the only supported "
-                "encoder-decoder model.")
     num_encoder_tokens =\
         self.scheduler_config.max_num_encoder_input_tokens
 else:
|
Reference in New Issue
Block a user