mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-05 11:54:26 +08:00
Increase #blocks
This commit is contained in:
parent
f42b4c27d8
commit
5323969fcf
@ -64,7 +64,7 @@ class TPUWorker(LoraNotSupportedWorkerBase):
|
|||||||
self.model_runner.load_model()
|
self.model_runner.load_model()
|
||||||
|
|
||||||
def determine_num_available_blocks(self) -> Tuple[int, int]:
|
def determine_num_available_blocks(self) -> Tuple[int, int]:
|
||||||
num_tpu_blocks = 100
|
num_tpu_blocks = 1000
|
||||||
return num_tpu_blocks, 0
|
return num_tpu_blocks, 0
|
||||||
|
|
||||||
def initialize_cache(
|
def initialize_cache(
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user