mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-03 09:17:03 +08:00
fix dp proxy
Signed-off-by: inkcherry <mingzhi.liu@amd.com>
This commit is contained in:
parent
f8e9adfea8
commit
68a2333339
@ -218,7 +218,9 @@ async def handle_request():
|
||||
req_data['kv_transfer_params']['remote_dp_size'] = prefill_instance_endpoint['dp_size']
|
||||
req_data['kv_transfer_params']['remote_tp_size'] = prefill_instance_endpoint['tp_size']
|
||||
|
||||
|
||||
if selected_prefill_dp_rank is not None:
|
||||
req_data['kv_transfer_params']['remote_dp_rank'] = selected_prefill_dp_rank
|
||||
|
||||
decode_request_task = asyncio.create_task(
|
||||
start_decode_request(decode_instance_endpoint['request_address'], req_data, request_id)
|
||||
)
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user