mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-02 16:04:28 +08:00
[Bugfix][TPU] Fix TPU sampler output (#5978)
This commit is contained in:
parent
7041de4384
commit
54814fd85b
@ -215,7 +215,7 @@ class TPUWorker(LoraNotSupportedWorkerBase):
|
|||||||
assert len(seq_group_metadata_list) > 0
|
assert len(seq_group_metadata_list) > 0
|
||||||
output = self.model_runner.execute_model(seq_group_metadata_list,
|
output = self.model_runner.execute_model(seq_group_metadata_list,
|
||||||
self.tpu_cache)
|
self.tpu_cache)
|
||||||
return [output]
|
return output
|
||||||
|
|
||||||
def cache_swap(
|
def cache_swap(
|
||||||
self,
|
self,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user