vllm/vllm/plugins/__init__.py
youkaichao ff5ed6e1bc
[torch.compile] rework compile control with piecewise cudagraph (#9715)
Signed-off-by: youkaichao <youkaichao@gmail.com>
2024-10-29 23:03:49 -07:00

58 lines
1.7 KiB
Python

import logging
from typing import Callable, Optional, Union
import vllm.envs as envs
from vllm.compilation.config import CompilationConfig
logger = logging.getLogger(__name__)
def load_general_plugins():
"""WARNING: plugins can be loaded for multiple times in different
processes. They should be designed in a way that they can be loaded
multiple times without causing issues.
"""
import sys
if sys.version_info < (3, 10):
from importlib_metadata import entry_points
else:
from importlib.metadata import entry_points
allowed_plugins = envs.VLLM_PLUGINS
discovered_plugins = entry_points(group='vllm.general_plugins')
for plugin in discovered_plugins:
logger.info("Found general plugin: %s", plugin.name)
if allowed_plugins is None or plugin.name in allowed_plugins:
try:
func = plugin.load()
func()
logger.info("Loaded general plugin: %s", plugin.name)
except Exception:
logger.exception("Failed to load general plugin: %s",
plugin.name)
_torch_compile_backend: Optional[Union[Callable, str]] = None
def set_torch_compile_backend(backend: Union[Callable, str]):
global _torch_compile_backend
_torch_compile_backend = backend
def get_torch_compile_backend() -> Optional[Union[Callable, str]]:
return _torch_compile_backend
_compilation_config: Optional[CompilationConfig] = None
def set_compilation_config(config: Optional[CompilationConfig]):
global _compilation_config
_compilation_config = config
def get_compilation_config() -> Optional[CompilationConfig]:
return _compilation_config