mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 02:25:36 +08:00
Don't use cupy when enforce_eager=True (#3037)
This commit is contained in:
parent
d9f726c4d0
commit
c1c0d00b88
@@ -284,7 +284,10 @@ class LLMEngine:
|
|||||||
is_driver_worker=True,
|
is_driver_worker=True,
|
||||||
)
|
)
|
||||||
|
|
||||||
self._run_workers("init_model", cupy_port=get_open_port())
|
# don't use cupy for eager mode
|
||||||
|
self._run_workers("init_model",
|
||||||
|
cupy_port=get_open_port()
|
||||||
|
if not model_config.enforce_eager else None)
|
||||||
self._run_workers(
|
self._run_workers(
|
||||||
"load_model",
|
"load_model",
|
||||||
max_concurrent_workers=self.parallel_config.
|
max_concurrent_workers=self.parallel_config.
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user