mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 09:05:01 +08:00
use device param in load_model method (#13037)
This commit is contained in:
parent
3b05cd4555
commit
fdc5df6f54
@ -1107,7 +1107,7 @@ class GPUModelRunnerBase(ModelRunnerBase[TModelInputForGPU]):
|
|||||||
|
|
||||||
def load_model(self) -> None:
|
def load_model(self) -> None:
|
||||||
logger.info("Starting to load model %s...", self.model_config.model)
|
logger.info("Starting to load model %s...", self.model_config.model)
|
||||||
with DeviceMemoryProfiler() as m:
|
with DeviceMemoryProfiler(self.device) as m:
|
||||||
self.model = get_model(vllm_config=self.vllm_config)
|
self.model = get_model(vllm_config=self.vllm_config)
|
||||||
|
|
||||||
self.model_memory_usage = m.consumed_memory
|
self.model_memory_usage = m.consumed_memory
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user