[Bugfix] Set enable_prefix_caching=True in prefix caching example (#3703)

2026-07-06 16:37:15 +08:00 · 2024-03-28 16:26:30 -07:00 · 2024-03-28 16:26:30 -07:00 · c0935c96d3
commit c0935c96d3
parent cb40b3ab6b
1 changed file with 1 addition and 1 deletion
--- a/examples/offline_inference_with_prefix.py
+++ b/examples/offline_inference_with_prefix.py
@@ -22,7 +22,7 @@ prompts = [
 sampling_params = SamplingParams(temperature=0.0)

 # Create an LLM.
-llm = LLM(model="facebook/opt-125m")
+llm = LLM(model="facebook/opt-125m", enable_prefix_caching=True)

 generating_prompts = [prefix + prompt for prompt in prompts]