mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-11 22:41:29 +08:00
[Core] Remove duplicate processing in async engine (#5525)
This commit is contained in:
parent
48f589e18b
commit
77490c6f2f
@@ -580,21 +580,9 @@ class AsyncLLMEngine:
         if arrival_time is None:
             arrival_time = time.time()
 
-        if self.engine_use_ray:
-            processed_inputs = await self.engine.process_model_inputs_async \
-                .remote(  # type: ignore
-                    request_id=request_id,
-                    inputs=inputs,
-                    lora_request=lora_request)
-        else:
-            processed_inputs = await self.engine.process_model_inputs_async(
-                request_id=request_id,
-                inputs=inputs,
-                lora_request=lora_request)
-
         stream = self._request_tracker.add_request(
             request_id,
-            inputs=processed_inputs,
+            inputs=inputs,
             params=params,
             arrival_time=arrival_time,
             lora_request=lora_request,
Loading…
x
Reference in New Issue
Block a user