Increase #blocks

This commit is contained in:
Woosuk Kwon 2024-04-24 08:56:58 +00:00
parent f42b4c27d8
commit 5323969fcf

View File

@@ -64,7 +64,7 @@ class TPUWorker(LoraNotSupportedWorkerBase):
self.model_runner.load_model()
def determine_num_available_blocks(self) -> Tuple[int, int]:
- num_tpu_blocks = 100
+ num_tpu_blocks = 1000
return num_tpu_blocks, 0
def initialize_cache(