Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2026-06-01 10:57:13 +08:00)
[bugfix] fix the default value of llm_int8_threshold in BitsAndBytesConfig (#10657)
This commit is contained in:
Parent: 1bf905ddaa
Commit: cfb3bf25fb
@ -26,7 +26,7 @@ class BitsAndBytesConfig(QuantizationConfig):
|
|||||||
llm_int8_enable_fp32_cpu_offload: bool = False,
|
llm_int8_enable_fp32_cpu_offload: bool = False,
|
||||||
llm_int8_has_fp16_weight: bool = False,
|
llm_int8_has_fp16_weight: bool = False,
|
||||||
llm_int8_skip_modules: Optional[List[str]] = None,
|
llm_int8_skip_modules: Optional[List[str]] = None,
|
||||||
llm_int8_threshold: float = 0.0,
|
llm_int8_threshold: float = 6.0,
|
||||||
) -> None:
|
) -> None:
|
||||||
|
|
||||||
self.load_in_8bit = load_in_8bit
|
self.load_in_8bit = load_in_8bit
|
||||||
@ -103,7 +103,7 @@ class BitsAndBytesConfig(QuantizationConfig):
|
|||||||
["llm_int8_skip_modules"],
|
["llm_int8_skip_modules"],
|
||||||
default_value=[])
|
default_value=[])
|
||||||
llm_int8_threshold = get_safe_value(config, ["llm_int8_threshold"],
|
llm_int8_threshold = get_safe_value(config, ["llm_int8_threshold"],
|
||||||
default_value=0.0)
|
default_value=6.0)
|
||||||
|
|
||||||
return cls(
|
return cls(
|
||||||
load_in_8bit=load_in_8bit,
|
load_in_8bit=load_in_8bit,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user