Correctly kill vLLM processes after finishing serving benchmarks (#21641)

Signed-off-by: Huy Do <huydhn@gmail.com>
2026-07-09 10:57:10 +08:00 · 2025-07-25 19:06:21 -07:00 · 2025-07-25 19:06:21 -07:00 · a55c95096b
commit a55c95096b
parent 97349fe2bc
1 changed files with 8 additions and 6 deletions
--- a/.buildkite/nightly-benchmarks/scripts/run-nightly-benchmarks.sh
+++ b/.buildkite/nightly-benchmarks/scripts/run-nightly-benchmarks.sh
@@ -95,12 +95,14 @@ json2args() {
 }
 kill_gpu_processes() {
-  pkill -f python
+  pkill -f '[p]ython'
-  pkill -f python3
+  pkill -f '[p]ython3'
-  pkill -f tritonserver
+  pkill -f '[t]ritonserver'
-  pkill -f pt_main_thread
+  pkill -f '[p]t_main_thread'
-  pkill -f text-generation
+  pkill -f '[t]ext-generation'
-  pkill -f lmdeploy
+  pkill -f '[l]mdeploy'
  # vLLM now names the process with VLLM prefix after https://github.com/vllm-project/vllm/pull/21445
  pkill -f '[V]LLM'
  while [ "$(nvidia-smi --query-gpu=memory.used --format=csv,noheader,nounits | head -n 1)" -ge 1000 ]; do
    sleep 1