Raise error for data-parallel with benchmark_throughput (#16737)

Signed-off-by: Kartik Ramesh <kartikx2000@gmail.com>
Co-authored-by: Simon Mo <simon.mo@hey.com>
This commit is contained in:
Kartik Ramesh 2025-04-21 10:51:43 -05:00 committed by GitHub
parent 55d6d3fdb8
commit 3b34fd5273
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -523,6 +523,13 @@ def validate_args(args):
raise ValueError(
"Tokenizer must be the same as the model for MII backend.")
# --data-parallel is not supported currently.
# https://github.com/vllm-project/vllm/issues/16222
if args.data_parallel_size > 1:
raise ValueError(
"Data parallel is not supported in offline benchmark, \
please use benchmark serving instead")
if __name__ == "__main__":
parser = FlexibleArgumentParser(description="Benchmark the throughput.")