This commit is contained in:
Chaofan Lin 2023-08-01 04:11:57 +08:00 committed by GitHub
parent 953f28cf9a
commit aa39e42c5a
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 2 additions and 2 deletions

View File

@@ -224,7 +224,7 @@ class SchedulerConfig:
a single iteration.
max_num_seqs: Maximum number of sequences to be processed in a single
iteration.
-max_seq_len: Maximum length of a sequence (including prompt
+max_model_len: Maximum length of a sequence (including prompt
and generated text).
"""

View File

@@ -353,7 +353,7 @@ class LLMEngine:
if stopped:
continue
-# Check if the sequence has reached max_seq_len.
+# Check if the sequence has reached max_model_len.
if seq.get_len() > self.scheduler_config.max_model_len:
self.scheduler.free_seq(
seq, SequenceStatus.FINISHED_LENGTH_CAPPED)