mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-14 00:25:23 +08:00
[Misc] remove old comments (#4866)
This commit is contained in:
parent
e08188081b
commit
10fa9eea21
@ -887,16 +887,6 @@ class ModelRunner:
|
|||||||
# This usually takes < 10 seconds.
|
# This usually takes < 10 seconds.
|
||||||
logger.info("Graph capturing finished in %.0f secs.", elapsed_time)
|
logger.info("Graph capturing finished in %.0f secs.", elapsed_time)
|
||||||
|
|
||||||
def __del__(self) -> None:
|
|
||||||
# Delete the CUDA graphs before deleting the pynccl communicator.
|
|
||||||
# NOTE(woosuk): This is necessary because otherwise deadlocks can
|
|
||||||
# happen.
|
|
||||||
# FIXME(woosuk): This is a bit hacky. Find a more robust solution.
|
|
||||||
# TODO(youkaichao): when we get enough user feedback that pynccl is
|
|
||||||
# more stable than cupy, we can remove this, e.g. in v0.4.1.
|
|
||||||
self.graph_runners.clear()
|
|
||||||
self.pynccl_backend = None
|
|
||||||
|
|
||||||
@property
|
@property
|
||||||
def vocab_size(self) -> int:
|
def vocab_size(self) -> int:
|
||||||
return self.model_config.get_vocab_size()
|
return self.model_config.get_vocab_size()
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user