mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 09:35:50 +08:00
[Bugfix] Set enable_prefix_caching=True in prefix caching example (#3703)
This commit is contained in:
parent
cb40b3ab6b
commit
c0935c96d3
@@ -22,7 +22,7 @@ prompts = [
|
||||
sampling_params = SamplingParams(temperature=0.0)
|
||||
|
||||
# Create an LLM.
|
||||
-llm = LLM(model="facebook/opt-125m")
|
||||
+llm = LLM(model="facebook/opt-125m", enable_prefix_caching=True)
|
||||
|
||||
generating_prompts = [prefix + prompt for prompt in prompts]
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user