mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-18 05:56:58 +08:00
[MISC] Remove FP8 warning (#5472)
Co-authored-by: Philipp Moritz <pcmoritz@gmail.com>
This commit is contained in:
parent
85657b5607
commit
30299a41fa
@@ -212,7 +212,7 @@ class ModelConfig:
|
|||||||
f"{self.quantization} quantization is currently not "
|
f"{self.quantization} quantization is currently not "
|
||||||
f"supported in ROCm.")
|
f"supported in ROCm.")
|
||||||
if (self.quantization
|
if (self.quantization
|
||||||
not in ["marlin", "gptq_marlin_24", "gptq_marlin"]):
|
not in ("fp8", "marlin", "gptq_marlin_24", "gptq_marlin")):
|
||||||
logger.warning(
|
logger.warning(
|
||||||
"%s quantization is not fully "
|
"%s quantization is not fully "
|
||||||
"optimized yet. The speed can be slower than "
|
"optimized yet. The speed can be slower than "
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user