mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 20:04:58 +08:00
Fix test_memory_usage_no_spec (#17754)
Signed-off-by: Yong Hoon Shin <yhshin@meta.com>
This commit is contained in:
parent
8a15c2603a
commit
324a3119b0
@@ -42,12 +42,12 @@ we can ensure we go through the _no_spec codepath for most of our engine steps.
|
||||
|
||||
def test_memory_usage_no_spec():
|
||||
previous_memory_allocated = None
|
||||
llm = vllm.LLM(
|
||||
model=MAIN_MODEL,
|
||||
speculative_model=SPEC_MODEL,
|
||||
num_speculative_tokens=3,
|
||||
speculative_disable_by_batch_size=SPEC_DISABLE_BATCH_SIZE,
|
||||
)
|
||||
llm = vllm.LLM(model=MAIN_MODEL,
|
||||
speculative_config={
|
||||
"model": SPEC_MODEL,
|
||||
"num_speculative_tokens": 3,
|
||||
"disable_by_batch_size": SPEC_DISABLE_BATCH_SIZE,
|
||||
})
|
||||
|
||||
batch_sequences = set()
|
||||
engine = llm.llm_engine
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user