From 2884e7f86192c287a0bcccdd57de1aae0ca35a75 Mon Sep 17 00:00:00 2001
From: Robert Shaw
Date: Sun, 13 Jul 2025 15:31:58 +0000
Subject: [PATCH] updated

Signed-off-by: Robert Shaw
---
 tools/smoke_tests/Justfile | 28 ++++++++++++++++++++++++++++
 1 file changed, 28 insertions(+)
 create mode 100644 tools/smoke_tests/Justfile

diff --git a/tools/smoke_tests/Justfile b/tools/smoke_tests/Justfile
new file mode 100644
index 0000000000000..d7d3c266dc2d7
--- /dev/null
+++ b/tools/smoke_tests/Justfile
@@ -0,0 +1,28 @@
+# Path to a local vLLM source checkout; set this on your machine.
+vllm-directory := "/home/rshaw/vllm/"
+
+# Serve MODEL with data parallelism SIZE and expert parallelism enabled.
+launch_dp_ep MODEL SIZE:
+    vllm serve {{MODEL}} --data-parallel-size {{SIZE}} --enable-expert-parallel
+
+# Serve MODEL with tensor parallelism SIZE.
+launch_tp MODEL SIZE:
+    vllm serve {{MODEL}} --tensor-parallel-size {{SIZE}}
+
+# No --port is passed to `vllm serve` above, so the server is expected on
+# vLLM's default port 8000.
+# Run the lm_eval gsm8k task against the local completions endpoint.
+eval MODEL:
+    lm_eval --model local-completions --tasks gsm8k \
+        --model_args model={{MODEL}},base_url=http://127.0.0.1:8000/v1/completions,num_concurrent=100,tokenized_requests=False
+
+# The seed is the current Unix time (`date +%s`), so it differs between runs.
+# Run benchmark_serving.py from the vLLM checkout with NUM_PROMPTS random prompts.
+benchmark MODEL NUM_PROMPTS:
+    python {{vllm-directory}}/benchmarks/benchmark_serving.py \
+        --model {{MODEL}} \
+        --dataset-name random \
+        --random-input-len 30000 \
+        --random-output-len 10 \
+        --num-prompts {{NUM_PROMPTS}} \
+        --seed $(date +%s)