mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 00:15:51 +08:00
[benchmarks] Allow skipping the ready check for bench serve (#25420)
Signed-off-by: Lu Fang <fanglu@fb.com>
Signed-off-by: Lucia Fang <116399278+luccafong@users.noreply.github.com>
Co-authored-by: Lucia (Lu) Fang <fanglu@meta.com>
This commit is contained in:
parent
f225ea7dd9
commit
eea1783989
@ -531,18 +531,22 @@ async def benchmark(
|
|||||||
extra_body=extra_body,
|
extra_body=extra_body,
|
||||||
)
|
)
|
||||||
|
|
||||||
test_output = await wait_for_endpoint(
|
if ready_check_timeout_sec > 0:
|
||||||
request_func,
|
test_output = await wait_for_endpoint(
|
||||||
test_input,
|
request_func,
|
||||||
session,
|
test_input,
|
||||||
timeout_seconds=ready_check_timeout_sec,
|
session,
|
||||||
)
|
timeout_seconds=ready_check_timeout_sec,
|
||||||
if not test_output.success:
|
)
|
||||||
raise ValueError(
|
if not test_output.success:
|
||||||
"Initial test run failed - Please make sure benchmark arguments "
|
raise ValueError(
|
||||||
f"are correctly specified. Error: {test_output.error}")
|
"Initial test run failed - Please make sure benchmark "
|
||||||
|
"arguments are correctly specified. "
|
||||||
|
f"Error: {test_output.error}")
|
||||||
|
else:
|
||||||
|
print("Initial test run completed. Starting main benchmark run...")
|
||||||
else:
|
else:
|
||||||
print("Initial test run completed. Starting main benchmark run...")
|
print("Skipping endpoint ready check.")
|
||||||
|
|
||||||
if lora_modules:
|
if lora_modules:
|
||||||
# For each input request, choose a LoRA module at random.
|
# For each input request, choose a LoRA module at random.
|
||||||
@ -1151,7 +1155,8 @@ def add_cli_args(parser: argparse.ArgumentParser):
|
|||||||
type=int,
|
type=int,
|
||||||
default=600,
|
default=600,
|
||||||
help="Maximum time to wait for the endpoint to become ready "
|
help="Maximum time to wait for the endpoint to become ready "
|
||||||
"in seconds (default: 600 seconds / 10 minutes).",
|
"in seconds (default: 600 seconds / 10 minutes). If set to 0, "
|
||||||
|
"the ready check will be skipped."
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user