[Core] Remove duplicate processing in async engine (#5525)

This commit is contained in:
Cyrus Leung 2024-06-15 01:04:42 +08:00 committed by GitHub
parent 48f589e18b
commit 77490c6f2f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -580,21 +580,9 @@ class AsyncLLMEngine:
if arrival_time is None:
arrival_time = time.time()
if self.engine_use_ray:
processed_inputs = await self.engine.process_model_inputs_async \
.remote( # type: ignore
request_id=request_id,
inputs=inputs,
lora_request=lora_request)
else:
processed_inputs = await self.engine.process_model_inputs_async(
request_id=request_id,
inputs=inputs,
lora_request=lora_request)
stream = self._request_tracker.add_request(
request_id,
inputs=processed_inputs,
inputs=inputs,
params=params,
arrival_time=arrival_time,
lora_request=lora_request,