mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-25 10:16:32 +08:00
[Misc] Do not print async output warning for v1 (#21151)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
5780121c95
commit
54cf1cae62
@@ -99,7 +99,7 @@ class CudaPlatformBase(Platform):
 
     @classmethod
     def is_async_output_supported(cls, enforce_eager: Optional[bool]) -> bool:
-        if enforce_eager:
+        if enforce_eager and not envs.VLLM_USE_V1:
             logger.warning(
                 "To see benefits of async output processing, enable CUDA "
                 "graph. Since, enforce-eager is enabled, async output "
@@ -299,7 +299,7 @@ class RocmPlatform(Platform):
 
     @classmethod
     def is_async_output_supported(cls, enforce_eager: Optional[bool]) -> bool:
-        if enforce_eager:
+        if enforce_eager and not envs.VLLM_USE_V1:
             logger.warning(
                 "To see benefits of async output processing, enable CUDA "
                 "graph. Since, enforce-eager is enabled, async output "
Loading…
x
Reference in New Issue
Block a user