diff --git a/vllm/model_executor/layers/quantization/__init__.py b/vllm/model_executor/layers/quantization/__init__.py index 1a4378f5df3db..48db0d1bbbd47 100644 --- a/vllm/model_executor/layers/quantization/__init__.py +++ b/vllm/model_executor/layers/quantization/__init__.py @@ -11,7 +11,6 @@ logger = init_logger(__name__) QuantizationMethods = Literal[ "awq", "deepspeedfp", - "tpu_int8", "fp8", "ptpc_fp8", "fbgemm_fp8",