mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 08:45:00 +08:00
[TPU] Fix the test_sampler (#17820)
This commit is contained in:
parent
ca04b97c93
commit
a463555dee
@@ -26,7 +26,7 @@ def test_sampler_different(model_name: str):
|
||||
enforce_eager=False,
|
||||
max_num_seqs=1,
|
||||
max_model_len=512,
|
||||
- max_num_batched_tokens=512)
|
||||
+ max_num_batched_tokens=256)
|
||||
prompts = [
|
||||
"Write a short story about a robot that dreams for the first time."
|
||||
]
|
||||
|
||||
@@ -95,7 +95,7 @@ class PallasMetadata:
|
||||
block_tables: torch.Tensor
|
||||
context_lens: torch.Tensor
|
||||
query_start_loc: torch.Tensor
|
||||
- num_seqs: int
|
||||
+ num_seqs: torch.Tensor
|
||||
|
||||
|
||||
class PallasAttentionBackendImpl(AttentionImpl):
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user