mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-12 14:27:08 +08:00
parent
7bb88b2edc
commit
7c16128106
27
benchmarks/sweep.sh
Normal file
27
benchmarks/sweep.sh
Normal file
@ -0,0 +1,27 @@
|
||||
# Sweep benchmark_serving.py across a list of request rates.
#
# For every rate in REQUEST_RATES, one benchmark run is launched against the
# "random" dataset with enough prompts to cover TOTAL_SECONDS of traffic at
# that rate (NUM_PROMPTS = TOTAL_SECONDS * REQUEST_RATE).
#
# Requires bash (uses arrays). The benchmark script path is relative, so run
# this from the directory that contains the vllm/ checkout.
# NOTE(review): presumably a server for MODEL must already be running before
# the sweep starts -- confirm against benchmark_serving.py.
#
# Environment:
#   FRAMEWORK  Prefix of the result file ("<FRAMEWORK>-results.json").
#              Previously never assigned, which produced "-results.json"
#              when unset; now defaults to "vllm" (assumed default, override
#              as needed).

MODEL=meta-llama/Llama-3.1-8B-Instruct
REQUEST_RATES=(1 10 15 20)   # request rates (QPS) to sweep over
INPUT_LEN=1000               # passed as --random-input-len
OUTPUT_LEN=100               # passed as --random-output-len
TOTAL_SECONDS=120            # target duration of each run at the given rate
FRAMEWORK=${FRAMEWORK:-vllm}

for REQUEST_RATE in "${REQUEST_RATES[@]}"; do
  # Scale the prompt count with the rate so each run spans TOTAL_SECONDS.
  NUM_PROMPTS=$((TOTAL_SECONDS * REQUEST_RATE))

  printf '\n%s\n\n' \
    "===== RUNNING $MODEL FOR $NUM_PROMPTS PROMPTS WITH $REQUEST_RATE QPS ====="

  # The request rate doubles as the seed, so each rate gets its own
  # deterministic seed.
  # NOTE(review): every iteration passes the same --result-filename; if
  # benchmark_serving.py overwrites rather than appends, only the last
  # rate's results survive -- confirm.
  python3 vllm/benchmarks/benchmark_serving.py \
    --model "$MODEL" \
    --dataset-name random \
    --random-input-len "$INPUT_LEN" \
    --random-output-len "$OUTPUT_LEN" \
    --request-rate "$REQUEST_RATE" \
    --num-prompts "$NUM_PROMPTS" \
    --seed "$REQUEST_RATE" \
    --ignore-eos \
    --result-filename "$FRAMEWORK-results.json" \
    --save-result

done
|
||||
Loading…
x
Reference in New Issue
Block a user