Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2025-12-29 23:58:51 +08:00)
Revert "[bench] Support common prefix len config (for decode-only bench)" (#31240)
Signed-off-by: Ming Yang <minos.future@gmail.com>
This commit is contained in:
Parent: 3ce791ac77
Commit: 3bb9561928
@@ -1847,7 +1847,6 @@ def get_samples(args, tokenizer: TokenizerLike) -> list[SampleRequest]:
|
||||
random_seed=args.seed,
|
||||
dataset_path=args.dataset_path,
|
||||
disable_shuffle=args.disable_shuffle,
|
||||
prefix_len=args.common_prefix_len,
|
||||
).sample(
|
||||
tokenizer=tokenizer,
|
||||
num_requests=args.num_prompts,
|
||||
|
||||
@@ -1281,12 +1281,6 @@ def add_cli_args(parser: argparse.ArgumentParser):
|
||||
help="Repetition penalty sampling parameter. Only has effect on "
|
||||
"openai-compatible backends.",
|
||||
)
|
||||
sampling_group.add_argument(
|
||||
"--common-prefix-len",
|
||||
type=int,
|
||||
default=None,
|
||||
help="Common prefix length shared by all prompts (used by random dataset)",
|
||||
)
|
||||
|
||||
parser.add_argument(
|
||||
"--served-model-name",
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user