diff --git a/examples/offline_inference/save_sharded_state.py b/examples/offline_inference/save_sharded_state.py index 9b154e370642..d6b8b7e6838d 100644 --- a/examples/offline_inference/save_sharded_state.py +++ b/examples/offline_inference/save_sharded_state.py @@ -29,6 +29,7 @@ import shutil from pathlib import Path from vllm import LLM, EngineArgs +from vllm.model_executor.model_loader import ShardedStateLoader from vllm.utils import FlexibleArgumentParser @@ -39,7 +40,10 @@ def parse_args(): "--output", "-o", required=True, type=str, help="path to output checkpoint" ) parser.add_argument( - "--file-pattern", type=str, help="string pattern of saved filenames" + "--file-pattern", + type=str, + default=ShardedStateLoader.DEFAULT_PATTERN, + help="string pattern of saved filenames", ) parser.add_argument( "--max-file-size",