From df62da8da2dea0c45558f7f044aff4e74625a963 Mon Sep 17 00:00:00 2001 From: Wei-Yu Lin Date: Tue, 16 Dec 2025 01:48:51 +0000 Subject: [PATCH] Remove tpu_int8, as it is related to the deleted quantization config and implementation Signed-off-by: Wei-Yu Lin --- vllm/model_executor/layers/quantization/__init__.py | 1 - 1 file changed, 1 deletion(-) diff --git a/vllm/model_executor/layers/quantization/__init__.py b/vllm/model_executor/layers/quantization/__init__.py index 1a4378f5df3db..48db0d1bbbd47 100644 --- a/vllm/model_executor/layers/quantization/__init__.py +++ b/vllm/model_executor/layers/quantization/__init__.py @@ -11,7 +11,6 @@ logger = init_logger(__name__) QuantizationMethods = Literal[ "awq", "deepspeedfp", - "tpu_int8", "fp8", "ptpc_fp8", "fbgemm_fp8",