mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 21:45:25 +08:00
[Bugfix] Disable prefix caching by default for benchmark (#18771)
Signed-off-by: cascade812 <cascade812@outlook.com>
This commit is contained in:
parent
e56f44d9ec
commit
51e98e4ffd
@@ -82,7 +82,7 @@ def add_cli_args(parser: argparse.ArgumentParser):
|
|||||||
parser = EngineArgs.add_cli_args(parser)
|
parser = EngineArgs.add_cli_args(parser)
|
||||||
# V1 enables prefix caching by default which skews the latency
|
# V1 enables prefix caching by default which skews the latency
|
||||||
# numbers. We need to disable prefix caching by default.
|
# numbers. We need to disable prefix caching by default.
|
||||||
parser.set_defaults(enable_prefix_caching=True)
|
parser.set_defaults(enable_prefix_caching=False)
|
||||||
|
|
||||||
|
|
||||||
def main(args: argparse.Namespace):
|
def main(args: argparse.Namespace):
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user