mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 10:26:11 +08:00
[Bugfix] Fix boolean conversion for OpenVINO env variable (#13615)
This commit is contained in:
parent
8354f6640c
commit
382f66fb08
@@ -360,8 +360,9 @@ environment_variables: Dict[str, Callable[[], Any]] = {
|
|||||||
# Enables weights compression during model export via HF Optimum
|
# Enables weights compression during model export via HF Optimum
|
||||||
# default is False
|
# default is False
|
||||||
"VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS":
|
"VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS":
|
||||||
lambda: bool(os.getenv("VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS", False)),
|
lambda:
|
||||||
|
(os.environ.get("VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS", "0").lower() in
|
||||||
|
("on", "true", "1")),
|
||||||
# If the env var is set, then all workers will execute as separate
|
# If the env var is set, then all workers will execute as separate
|
||||||
# processes from the engine, and we use the same mechanism to trigger
|
# processes from the engine, and we use the same mechanism to trigger
|
||||||
# execution on all workers.
|
# execution on all workers.
|
||||||
|
|||||||
@@ -125,7 +125,8 @@ class OpenVINOCausalLM(nn.Module):
|
|||||||
"as-is, all possible options that may affect model conversion "
|
"as-is, all possible options that may affect model conversion "
|
||||||
"are ignored.")
|
"are ignored.")
|
||||||
|
|
||||||
load_in_8bit = envs.VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS
|
load_in_8bit = (envs.VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS
|
||||||
|
if export else False)
|
||||||
pt_model = OVModelForCausalLM.from_pretrained(
|
pt_model = OVModelForCausalLM.from_pretrained(
|
||||||
model_config.model,
|
model_config.model,
|
||||||
export=export,
|
export=export,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user