mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-06 19:29:09 +08:00
[Bugfix] Apply same sampling parameters for both n=1 and n>1 (#26005)
Signed-off-by: Kenichi Maehashi <maehashi@preferred.jp>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
aeff0604bb
commit
0944358a90
@@ -290,7 +290,7 @@ class AsyncLLM(EngineClient):
             return queue
 
         # Fan out child requests (for n>1).
-        parent_request = ParentRequest(request_id, params)
+        parent_request = ParentRequest(request_id, request.sampling_params)
         for idx in range(params.n):
             request_id, params = parent_request.get_child_info(idx)
             child_request = request if idx == params.n - 1 else copy(request)
Loading…
x
Reference in New Issue
Block a user