mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-14 05:25:20 +08:00
[Bugfix] Offline example of disaggregated prefill (#13214)
This commit is contained in:
parent
067678262a
commit
84683fa271
@@ -22,7 +22,7 @@ def run_prefill(prefill_done):
|
|||||||
# and 3 and do prefilling on request 2.
|
# and 3 and do prefilling on request 2.
|
||||||
prompts = [
|
prompts = [
|
||||||
"Hello, my name is",
|
"Hello, my name is",
|
||||||
# "Hi, your name is",
|
"Hi, your name is",
|
||||||
# The decode node will actually "prefill" this request.
|
# The decode node will actually "prefill" this request.
|
||||||
"Tell me a very long story",
|
"Tell me a very long story",
|
||||||
]
|
]
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user