mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-09 06:35:42 +08:00
Fix latency benchmark script (#2035)
This commit is contained in:
parent
beeee69bc9
commit
5dd80d3777
@ -72,7 +72,7 @@ def main(args: argparse.Namespace):
|
|||||||
# Benchmark.
|
# Benchmark.
|
||||||
latencies = []
|
latencies = []
|
||||||
for _ in tqdm(range(args.num_iters), desc="Profiling iterations"):
|
for _ in tqdm(range(args.num_iters), desc="Profiling iterations"):
|
||||||
latencies.append(run_to_completion(profile=False))
|
latencies.append(run_to_completion(profile_dir=None))
|
||||||
print(f'Avg latency: {np.mean(latencies)} seconds')
|
print(f'Avg latency: {np.mean(latencies)} seconds')
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user