diff --git a/benchmarks/benchmark_serving.py b/benchmarks/benchmark_serving.py
index 7d389a9c7d70..3f5e2d9c8f4d 100644
--- a/benchmarks/benchmark_serving.py
+++ b/benchmarks/benchmark_serving.py
@@ -12,7 +12,7 @@ On the server side, run one of the following commands:
 On the client side, run:
     python benchmarks/benchmark_serving.py \
         --backend <backend> \
-        --tokenizer <your_model> --dataset <target_dataset> \
+        --model <your_model> --dataset <target_dataset> \
         --request-rate <request_rate>
 """
 import argparse
@@ -171,10 +171,10 @@ async def benchmark(
     else:
         raise ValueError(f"Unknown backend: {backend}")
 
-    pbar = None if disable_tqdm else tqdm(total=len(input_requests))
-
     print(f"Traffic request rate: {request_rate}")
 
+    pbar = None if disable_tqdm else tqdm(total=len(input_requests))
+
     benchmark_start_time = time.perf_counter()
     tasks = []
     async for request in get_request(input_requests, request_rate):