mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-21 02:47:02 +08:00
more cleanup
Signed-off-by: Sage Moore <sage@neuralmagic.com>
This commit is contained in:
parent
f7b6e600b8
commit
510e839429
@ -1553,6 +1553,8 @@ class GPUModelRunner(LoRAModelRunnerMixin):
|
||||
|
||||
def model_inputs(tokens_slice: slice, use_dummy_input: bool) -> tuple:
|
||||
if use_dummy_input:
|
||||
logger.info(f"NUM DUMMY TOKENS: {num_dummy_tokens} token slize: {tokens_slice}")
|
||||
assert num_dummy_tokens == tokens_slice.stop - tokens_slice.start
|
||||
return self._get_dummy_model_inputs(num_dummy_tokens)
|
||||
else:
|
||||
assert scheduler_output is not None
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user