mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-25 16:39:39 +08:00
[Core] Remove duplicate processing in async engine (#5525)
This commit is contained in:
parent
48f589e18b
commit
77490c6f2f
@@ -580,21 +580,9 @@ class AsyncLLMEngine:
         if arrival_time is None:
             arrival_time = time.time()
 
-        if self.engine_use_ray:
-            processed_inputs = await self.engine.process_model_inputs_async \
-                .remote( # type: ignore
-                    request_id=request_id,
-                    inputs=inputs,
-                    lora_request=lora_request)
-        else:
-            processed_inputs = await self.engine.process_model_inputs_async(
-                request_id=request_id,
-                inputs=inputs,
-                lora_request=lora_request)
-
         stream = self._request_tracker.add_request(
             request_id,
-            inputs=processed_inputs,
+            inputs=inputs,
             params=params,
             arrival_time=arrival_time,
             lora_request=lora_request,
Loading…
x
Reference in New Issue
Block a user