From 786030721efb2b85a582d65f9bb5d7197de06f83 Mon Sep 17 00:00:00 2001 From: Ning Xie Date: Tue, 4 Nov 2025 04:35:16 +0800 Subject: [PATCH] [Docs] add runai_streamer_sharded to LoadConfig (#27937) Signed-off-by: Andy Xie --- vllm/config/load.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/vllm/config/load.py b/vllm/config/load.py index d625c1ac987e7..e424f8c5edb62 100644 --- a/vllm/config/load.py +++ b/vllm/config/load.py @@ -40,6 +40,8 @@ class LoadConfig: more information.\n - "runai_streamer" will load the Safetensors weights using Run:ai Model Streamer.\n + - "runai_streamer_sharded" will load weights from pre-sharded checkpoint + files using Run:ai Model Streamer.\n - "bitsandbytes" will load the weights using bitsandbytes quantization.\n - "sharded_state" will load weights from pre-sharded checkpoint files, supporting efficient loading of tensor-parallel models.\n