mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-24 16:15:54 +08:00
[bench] Support common prefix len config (for decode-only bench) (#29934)
Signed-off-by: Ming Yang <minos.future@gmail.com>
This commit is contained in:
parent
65ee97288a
commit
f16356fe36
@@ -1842,6 +1842,7 @@ def get_samples(args, tokenizer) -> list[SampleRequest]:
|
||||
random_seed=args.seed,
|
||||
dataset_path=args.dataset_path,
|
||||
disable_shuffle=args.disable_shuffle,
|
||||
prefix_len=args.common_prefix_len,
|
||||
).sample(
|
||||
tokenizer=tokenizer,
|
||||
num_requests=args.num_prompts,
|
||||
|
||||
@@ -1221,6 +1221,12 @@ def add_cli_args(parser: argparse.ArgumentParser):
|
||||
help="Repetition penalty sampling parameter. Only has effect on "
|
||||
"openai-compatible backends.",
|
||||
)
|
||||
sampling_group.add_argument(
|
||||
"--common-prefix-len",
|
||||
type=int,
|
||||
default=None,
|
||||
help="Common prefix length shared by all prompts (used by random dataset)",
|
||||
)
|
||||
|
||||
parser.add_argument(
|
||||
"--tokenizer-mode",
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user