From 4693a3438cebd6c2f764ad67af5a85f85d03db13 Mon Sep 17 00:00:00 2001
From: Calvin Chen <45745657+calvin0327@users.noreply.github.com>
Date: Tue, 27 May 2025 15:12:02 +0800
Subject: [PATCH] [Doc] cleanup deprecated flag for doc (#18715)

Signed-off-by: calvin chen <120380290@qq.com>
---
 benchmarks/README.md | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/benchmarks/README.md b/benchmarks/README.md
index 4a8ab895e18e9..ecab570bb31c4 100644
--- a/benchmarks/README.md
+++ b/benchmarks/README.md
@@ -146,10 +146,9 @@ python3 vllm/benchmarks/benchmark_serving.py \
 
 ``` bash
 VLLM_USE_V1=1 vllm serve meta-llama/Meta-Llama-3-8B-Instruct \
-    --speculative-model "[ngram]" \
     --ngram_prompt_lookup_min 2 \
     --ngram-prompt-lookup-max 5 \
-    --num_speculative_tokens 5
+    --speculative_config '{"model": "[ngram]", "num_speculative_tokens": 5}'
 ```
 
 ``` bash
@@ -274,10 +273,9 @@ python3 vllm/benchmarks/benchmark_throughput.py \
     --output-len=100 \
     --num-prompts=2048 \
     --async-engine \
-    --speculative-model="[ngram]" \
     --ngram_prompt_lookup_min=2 \
     --ngram-prompt-lookup-max=5 \
-    --num_speculative_tokens=5
+    --speculative_config '{"model": "[ngram]", "num_speculative_tokens": 5}'
 ```
 
 ```