mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-14 19:05:35 +08:00
[Intel GPU] support ray as distributed executor backend for XPU. (#20659)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
This commit is contained in:
parent
e760fcef22
commit
b6e7e3d58f
@@ -27,6 +27,8 @@ docker run \
 "${image_name}" \
 sh -c '
 VLLM_USE_V1=1 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m --block-size 64 --enforce-eager
+VLLM_USE_V1=1 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m --block-size 64 --enforce-eager -tp 2 --distributed-executor-backend ray
+VLLM_USE_V1=1 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m --block-size 64 --enforce-eager -tp 2 --distributed-executor-backend mp
 cd tests
 pytest -v -s v1/core
 '
|
|||||||
@@ -62,7 +62,7 @@ class RayDistributedExecutor(DistributedExecutorBase):
 
     def _init_executor(self) -> None:
         self.forward_dag: Optional[ray.dag.CompiledDAG] = None
-        if envs.VLLM_USE_V1 and not current_platform.is_xpu():
+        if envs.VLLM_USE_V1:
             # V1 uses SPMD worker and compiled DAG
             os.environ["VLLM_USE_RAY_SPMD_WORKER"] = "1"
             os.environ["VLLM_USE_RAY_COMPILED_DAG"] = "1"
Loading…
x
Reference in New Issue
Block a user