# Patch for tools/smoke_tests/Justfile (single hunk, old lines 2-21 -> new lines 2-21).
#
# What the hunk changes:
#   * launch_dp_ep / launch_tp: append `--disable-log-requests` to both
#     `vllm serve` invocations.
#   * eval: the lm_eval base_url port changes from 800 to 8000.
#   * benchmark: --random-input-len goes 30000 -> 1000 and
#     --random-output-len goes 10 -> 100.
#   * benchmark: the trailing line-continuation backslash after the final
#     `--seed $(date +%s)` argument (the last line of the file) is removed.
#     The file still has no newline at end of file on both sides.
#
# NOTE(review): this patch was recovered from a copy in which all line breaks
# and runs of whitespace had been collapsed. The line structure below follows
# the hunk header counts (20 old / 20 new lines), but the leading indentation
# of the recipe lines is an assumption -- confirm it against the target file
# before applying (or apply with whitespace-insensitive matching).
diff --git a/tools/smoke_tests/Justfile b/tools/smoke_tests/Justfile
index d7d3c266dc2d7..8ef526f4dd505 100644
--- a/tools/smoke_tests/Justfile
+++ b/tools/smoke_tests/Justfile
@@ -2,20 +2,20 @@
 vllm-directory := "/home/rshaw/vllm/"
 
 launch_dp_ep MODEL SIZE:
-  vllm serve {{MODEL}} --data-parallel-size {{SIZE}} --enable-expert-parallel
+  vllm serve {{MODEL}} --data-parallel-size {{SIZE}} --enable-expert-parallel --disable-log-requests
 
 launch_tp MODEL SIZE:
-  vllm serve {{MODEL}} --tensor-parallel-size {{SIZE}}
+  vllm serve {{MODEL}} --tensor-parallel-size {{SIZE}} --disable-log-requests
 
 eval MODEL:
   lm_eval --model local-completions --tasks gsm8k \
-    --model_args model={{MODEL}},base_url=http://127.0.0.1:800/v1/completions,num_concurrent=100,tokenized_requests=False
+    --model_args model={{MODEL}},base_url=http://127.0.0.1:8000/v1/completions,num_concurrent=100,tokenized_requests=False
 
 benchmark MODEL NUM_PROMPTS:
   python {{vllm-directory}}/benchmarks/benchmark_serving.py \
     --model {{MODEL}} \
     --dataset-name random \
-    --random-input-len 30000 \
-    --random-output-len 10 \
+    --random-input-len 1000 \
+    --random-output-len 100 \
     --num-prompts {{NUM_PROMPTS}} \
-    --seed $(date +%s) \
\ No newline at end of file
+    --seed $(date +%s)
\ No newline at end of file