mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 04:05:01 +08:00
[Misc] SpecDecodeWorker supports profiling (#9719)
Signed-off-by: Abatom <abatom@163.com>
This commit is contained in:
parent
6650e6a930
commit
67a6882da4
@@ -1038,6 +1038,14 @@ class SpecDecodeWorker(LoraNotSupportedWorkerBase):
         """
         raise NotImplementedError
 
+    def start_profile(self):
+        if isinstance(self.scorer_worker, Worker):
+            self.scorer_worker.start_profile()
+
+    def stop_profile(self):
+        if isinstance(self.scorer_worker, Worker):
+            self.scorer_worker.stop_profile()
+
 
 def split_num_cache_blocks_evenly(scorer_cache_block_size_bytes: int,
                                   proposer_cache_block_size_bytes: int,
Loading…
x
Reference in New Issue
Block a user