mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-04 12:17:06 +08:00
yapf
This commit is contained in:
parent
4cdb732cef
commit
31d05f7edb
@ -65,10 +65,10 @@ class TPUExecutor(ExecutorBase):
|
||||
"""
|
||||
# Get the maximum number of blocks that can be allocated on TPU.
|
||||
num_tpu_blocks = self.driver_worker.profile_num_available_blocks(
|
||||
block_size=self.cache_config.block_size,
|
||||
gpu_memory_utilization=self.cache_config.gpu_memory_utilization,
|
||||
cache_dtype=self.cache_config.cache_dtype,
|
||||
)
|
||||
block_size=self.cache_config.block_size,
|
||||
gpu_memory_utilization=self.cache_config.gpu_memory_utilization,
|
||||
cache_dtype=self.cache_config.cache_dtype,
|
||||
)
|
||||
logger.info(f"# TPU blocks: {num_tpu_blocks}")
|
||||
|
||||
check_block_size_valid(num_tpu_blocks, self.cache_config.block_size,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user